Train size: 80 Test size: 20
	Tokenizer: ../home/arg_mining/4epoch_complete/tokenizer Model: ../home/arg_mining/4epoch_complete/model/


		-------------RUN 1-----------
			------------EPOCH 1---------------
Evaluating
				 {'precision': {'supports': 0.6, 'contradicts': 0.0, 'parts_of_same': 0.13254901960784313}, 'recall': {'supports': 0.0030643513789581204, 'contradicts': 0.0, 'parts_of_same': 0.9941176470588236}, 'f1': {'supports': 0.006097560975609756, 'contradicts': 0.0, 'parts_of_same': 0.2339100346020761}, 'support': {'supports': 979, 'contradicts': 131, 'parts_of_same': 170}, 'micro_avg': {'precision': 0.134375, 'recall': 0.134375, 'f1': 0.134375, 'support': None}, 'macro_avg': {'precision': 0.2441830065359477, 'recall': 0.33239399947926057, 'f1': 0.08000253185922862, 'support': None}, 'weighted_avg': {'precision': 0.4765104166666666, 'recall': 0.134375, 'f1': 0.03572985787302725, 'support': None}}
Loss: tensor(2.0638, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8839, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9720, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3980, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3927, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0935, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8741, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2848, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7789, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4866, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2794, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7741, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0889, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3720, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3934, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3998, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3860, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3737, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3848, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3834, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3937, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3906, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2961, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2806, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0969, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0992, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2921, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3782, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3860, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5857, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2936, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3890, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3906, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8941, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2994, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0933, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6995, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2951, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9819, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3931, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1945, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3849, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3846, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2912, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0951, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2833, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2818, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2962, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0784, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8887, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2758, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2834, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6862, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4806, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4762, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2891, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2891, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1896, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4806, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2733, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0952, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1969, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2999, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7833, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3873, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2637, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5917, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1976, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1945, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1968, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2947, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1934, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0925, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1789, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2909, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0000, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3839, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0947, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0987, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1878, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2924, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0789, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6784, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1777, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0903, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9953, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1947, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2919, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1752, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1853, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0787, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2957, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6796, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4824, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1903, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1994, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0909, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0840, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1808, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0862, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7986, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0751, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5938, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1930, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4914, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6985, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0739, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9915, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2862, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3930, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5972, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2898, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2971, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7881, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0767, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6936, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4958, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2803, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3784, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4862, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0988, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1979, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5980, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0796, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6883, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1943, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1942, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4980, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3853, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0930, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0936, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1870, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1954, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0742, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4908, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3990, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0997, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1739, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6889, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1981, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4762, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7969, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2690, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3808, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1840, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1806, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1805, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0835, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1817, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3736, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2989, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0834, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5994, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8911, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1782, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3988, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1575, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2927, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3972, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9848, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3923, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0938, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4796, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0971, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3911, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0877, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6817, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1873, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5886, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2927, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0995, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1852, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9972, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5955, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1973, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2848, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0957, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3687, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1998, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8898, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0975, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0806, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9927, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1883, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2801, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0909, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2957, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1752, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9835, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1969, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0789, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5888, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1870, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0820, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4736, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1926, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1830, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1898, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6801, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2820, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0968, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3965, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1926, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0679, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1888, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0637, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6875, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1993, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1949, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0937, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8883, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5821, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2889, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3736, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1999, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2733, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6953, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5803, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1819, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4637, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8660, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4910, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7931, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6971, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4962, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0944, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6973, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2999, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0637, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2742, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1772, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2848, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1935, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8947, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0787, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0989, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0952, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4904, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3920, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1821, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6947, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0999, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0789, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1767, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5991, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1928, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1887, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7965, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0928, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9998, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0870, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4801, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3939, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7801, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1914, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0986, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1852, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7930, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0751, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3830, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0909, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1742, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0883, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0803, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9993, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3989, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1848, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5913, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0956, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0891, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3914, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3887, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1637, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1716, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0863, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0904, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1993, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7940, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0980, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0575, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3676, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0821, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2752, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1794, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3921, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3913, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3801, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7957, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1772, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4742, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4820, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2782, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5777, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1818, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5946, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1981, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2875, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1758, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0751, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1857, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3886, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0941, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3835, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0939, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0916, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2885, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3771, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1918, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1720, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1730, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0889, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2821, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2972, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2955, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2909, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1913, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4883, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0943, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1997, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0747, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6916, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1863, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6762, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2693, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0952, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2953, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0939, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2918, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1985, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1739, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0972, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0997, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3819, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0986, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1777, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0923, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2937, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8835, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4996, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1803, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0808, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3962, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0945, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 2---------------
Evaluating
				 {'precision': {'supports': 0.9546742209631728, 'contradicts': 0.3323615160349854, 'parts_of_same': 0.5324675324675324}, 'recall': {'supports': 0.6884576098059244, 'contradicts': 0.8702290076335878, 'parts_of_same': 0.7235294117647059}, 'f1': {'supports': 0.8, 'contradicts': 0.48101265822784806, 'parts_of_same': 0.6134663341645885}, 'support': {'supports': 979, 'contradicts': 131, 'parts_of_same': 170}, 'micro_avg': {'precision': 0.71171875, 'recall': 0.71171875, 'f1': 0.71171875, 'support': None}, 'macro_avg': {'precision': 0.6065010898218969, 'recall': 0.760738676401406, 'f1': 0.6314929974641456, 'support': None}, 'weighted_avg': {'precision': 0.8349100792523514, 'recall': 0.71171875, 'f1': 0.7425796367467408, 'support': None}}
Loss: tensor(0.0433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0908, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3944, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0835, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0751, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2960, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2796, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1940, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3846, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1747, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1881, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1815, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4980, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3687, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4993, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5980, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1992, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0920, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0720, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1637, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2877, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0896, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0638, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0730, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1767, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2817, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0939, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0917, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0926, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0687, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3741, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0949, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5730, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1733, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1921, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3948, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1935, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0747, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4794, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0969, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0896, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0962, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0796, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0777, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0737, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0959, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1818, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4940, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0840, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3834, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1898, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0904, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0777, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0896, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0637, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2800, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0806, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0752, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0951, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3945, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1912, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0921, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0888, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5857, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0817, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1866, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0637, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0793, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0936, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0926, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3794, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0762, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0975, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0679, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1993, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0767, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0830, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0941, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7975, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0997, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0943, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1996, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0805, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3679, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7839, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3987, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1959, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6857, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1777, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1862, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1986, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0982, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0833, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1971, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2971, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1863, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4896, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0833, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0982, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0985, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0915, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5879, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0857, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3953, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0975, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0948, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3751, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2939, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0923, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0947, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3990, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1747, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2733, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0772, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0772, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2916, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0947, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0863, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6874, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0969, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1993, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0979, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1896, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3819, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5877, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2839, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2955, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0948, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1969, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7931, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0952, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1939, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0690, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0912, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3878, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4971, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1834, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0968, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0877, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1835, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0897, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2911, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0764, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0660, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3739, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2575, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0874, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0764, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1954, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1993, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0803, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4875, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0957, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2818, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2870, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0886, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1787, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2949, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2805, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0733, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3935, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2985, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0972, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9000, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0834, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0837, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0956, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0954, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0784, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1888, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3943, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1801, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1860, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0817, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2923, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1940, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3739, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0938, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0923, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0733, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0975, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3837, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0720, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1741, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0887, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5883, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3637, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1991, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1930, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3918, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0835, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0903, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0927, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0742, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4874, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0946, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3926, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0933, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2931, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1772, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2913, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2887, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0733, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0927, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0637, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0995, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0920, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1803, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3906, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0959, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0834, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0981, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0949, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0896, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0887, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2690, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1998, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0906, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0877, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0953, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0833, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0971, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4874, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0805, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3989, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5987, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0762, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0800, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0815, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6834, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1690, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3903, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1687, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0941, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0951, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0919, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0741, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2835, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1853, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0830, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0862, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1931, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1943, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1927, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4897, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7660, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2879, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3716, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3940, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4989, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0844, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 3---------------
Evaluating
				 {'precision': {'supports': 0.9595300261096605, 'contradicts': 0.35855263157894735, 'parts_of_same': 0.6333333333333333}, 'recall': {'supports': 0.7507660878447395, 'contradicts': 0.8320610687022901, 'parts_of_same': 0.7823529411764706}, 'f1': {'supports': 0.8424068767908309, 'contradicts': 0.5011494252873564, 'parts_of_same': 0.7000000000000001}, 'support': {'supports': 979, 'contradicts': 131, 'parts_of_same': 170}, 'micro_avg': {'precision': 0.76328125, 'recall': 0.76328125, 'f1': 0.76328125, 'support': None}, 'macro_avg': {'precision': 0.6504719970073137, 'recall': 0.7883933659078334, 'f1': 0.6811854340260625, 'support': None}, 'weighted_avg': {'precision': 0.854700747628802, 'recall': 0.76328125, 'f1': 0.78856789616474, 'support': None}}
Loss: tensor(0.0828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0808, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4794, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3771, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0943, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0900, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4676, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3892, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0638, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1853, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0928, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1914, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2995, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1948, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0957, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0949, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7906, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1910, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0908, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0878, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0846, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0794, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0873, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0878, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2716, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7794, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0980, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0948, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2957, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3846, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0796, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0873, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1877, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3819, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0945, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8679, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3949, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0941, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0817, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0943, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0784, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0965, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3638, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4870, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0998, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0833, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0889, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0764, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0742, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1837, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0962, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1888, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0820, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0863, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5890, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0906, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1996, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0935, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0906, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1952, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8771, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1971, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0993, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0808, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0958, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3867, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0927, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1920, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0716, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0990, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2934, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0909, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1835, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5881, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2967, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3976, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1909, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0575, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4989, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1733, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7987, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1638, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3915, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3849, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1849, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0820, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0638, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2919, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1904, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4777, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0903, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7863, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5764, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2808, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0638, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1892, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1951, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0877, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3819, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0739, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7982, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0751, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0693, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5990, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0927, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5739, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4979, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1000, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0830, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1951, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0937, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0900, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0637, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1892, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0957, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2994, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0690, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0972, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0959, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9908, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1938, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9801, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0910, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0925, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1824, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7924, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2758, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3914, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0994, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0837, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2824, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1923, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0885, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2948, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3908, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0909, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6949, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 4---------------
Evaluating
				 {'precision': {'supports': 0.9521640091116174, 'contradicts': 0.580110497237569, 'parts_of_same': 0.6018099547511312}, 'recall': {'supports': 0.8539325842696629, 'contradicts': 0.8015267175572519, 'parts_of_same': 0.7823529411764706}, 'f1': {'supports': 0.9003769520732363, 'contradicts': 0.673076923076923, 'parts_of_same': 0.6803069053708439}, 'support': {'supports': 979, 'contradicts': 131, 'parts_of_same': 170}, 'micro_avg': {'precision': 0.8390625, 'recall': 0.8390625, 'f1': 0.8390625000000002, 'support': None}, 'macro_avg': {'precision': 0.7113614870334392, 'recall': 0.8126040810011285, 'f1': 0.751253593507001, 'support': None}, 'weighted_avg': {'precision': 0.8675552596610057, 'recall': 0.8390625, 'f1': 0.8478861616529834, 'support': None}}
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5840, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8897, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0988, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0987, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5870, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0956, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0991, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0747, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5915, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2946, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4953, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0967, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0747, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0923, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5849, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3821, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6951, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0784, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0873, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0971, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0906, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0892, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1803, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0875, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0972, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4852, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1956, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2946, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1801, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0939, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0965, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3954, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7889, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3777, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5953, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7937, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3945, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0986, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2806, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0860, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2930, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3737, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1976, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0928, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8982, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0931, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1835, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0679, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0801, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0857, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0916, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0914, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5951, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0777, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0888, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4987, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1891, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0885, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0866, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0687, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3988, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6739, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0777, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0803, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0575, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0660, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 5---------------
Evaluating
				 {'precision': {'supports': 0.9329608938547486, 'contradicts': 0.538860103626943, 'parts_of_same': 0.609375}, 'recall': {'supports': 0.8529111338100103, 'contradicts': 0.7938931297709924, 'parts_of_same': 0.6882352941176471}, 'f1': {'supports': 0.8911419423692636, 'contradicts': 0.6419753086419753, 'parts_of_same': 0.6464088397790055}, 'support': {'supports': 979, 'contradicts': 131, 'parts_of_same': 170}, 'micro_avg': {'precision': 0.825, 'recall': 0.825, 'f1': 0.825, 'support': None}, 'macro_avg': {'precision': 0.6937319991605638, 'recall': 0.7783465192328833, 'f1': 0.7265086969300815, 'support': None}, 'weighted_avg': {'precision': 0.8496508895772878, 'recall': 0.825, 'f1': 0.8331376795109678, 'support': None}}
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0915, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0931, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4938, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0877, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0924, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0862, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5955, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6000, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1806, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1963, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3817, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3961, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0911, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3995, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3575, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1690, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3575, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0992, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5995, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6875, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0967, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0830, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4919, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1772, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0961, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0980, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3921, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0875, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7762, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0913, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0989, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1979, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1963, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2913, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0896, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0821, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1892, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1000, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0935, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0676, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1997, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0963, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0991, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4852, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0866, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3971, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2909, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6805, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3860, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5995, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3911, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0952, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1892, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0771, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1820, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2660, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0997, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7898, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9956, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4848, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1676, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0958, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0878, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0857, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1998, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2921, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0891, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3976, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9771, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6787, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3638, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0963, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4637, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0906, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6953, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3924, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0944, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0575, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3803, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3870, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4887, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3800, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0772, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2975, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0961, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3808, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3998, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1920, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1835, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0949, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0996, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0796, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1793, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9595e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 6---------------
Evaluating
				 {'precision': {'supports': 0.933570581257414, 'contradicts': 0.4343891402714932, 'parts_of_same': 0.5648148148148148}, 'recall': {'supports': 0.8038815117466803, 'contradicts': 0.732824427480916, 'parts_of_same': 0.7176470588235294}, 'f1': {'supports': 0.8638858397365533, 'contradicts': 0.5454545454545454, 'parts_of_same': 0.6321243523316061}, 'support': {'supports': 979, 'contradicts': 131, 'parts_of_same': 170}, 'micro_avg': {'precision': 0.78515625, 'recall': 0.78515625, 'f1': 0.78515625, 'support': None}, 'macro_avg': {'precision': 0.6442581787812407, 'recall': 0.7514509993503752, 'f1': 0.6804882458409017, 'support': None}, 'weighted_avg': {'precision': 0.8335071054258535, 'recall': 0.78515625, 'f1': 0.8005155644164095, 'support': None}}
Loss: tensor(0.0686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0938, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0687, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0986, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0928, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0808, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0975, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3979, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0937, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0967, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0887, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2994, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0886, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0693, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1679, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0963, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0955, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6818, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8992, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0997, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1820, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1934, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1962, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0957, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0877, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0941, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0867, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0747, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1988, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0784, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0941, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0835, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1821, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0993, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1938, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0945, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2857, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3909, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9015e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2920, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0676, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3846, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2772, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0935, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3767e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9892, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1933, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0874, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3957, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0815, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0784, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0767, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1820, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1928, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1975, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1879, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 7---------------
Evaluating
				 {'precision': {'supports': 0.9305103148751357, 'contradicts': 0.6212121212121212, 'parts_of_same': 0.5859030837004405}, 'recall': {'supports': 0.8753830439223698, 'contradicts': 0.6259541984732825, 'parts_of_same': 0.7823529411764706}, 'f1': {'supports': 0.9021052631578947, 'contradicts': 0.623574144486692, 'parts_of_same': 0.6700251889168766}, 'support': {'supports': 979, 'contradicts': 131, 'parts_of_same': 170}, 'micro_avg': {'precision': 0.8375, 'recall': 0.8375, 'f1': 0.8375, 'support': None}, 'macro_avg': {'precision': 0.7125418399292324, 'recall': 0.7612300611907076, 'f1': 0.7319015321871545, 'support': None}, 'weighted_avg': {'precision': 0.8530874299770475, 'recall': 0.8375, 'f1': 0.8427762091212536, 'support': None}}
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0917, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4992, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0793, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0736, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1751, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3931, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0863, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5960, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 8---------------
Evaluating
				 {'precision': {'supports': 0.921161825726141, 'contradicts': 0.5947712418300654, 'parts_of_same': 0.6993865030674846}, 'recall': {'supports': 0.9061224489795918, 'contradicts': 0.6946564885496184, 'parts_of_same': 0.6745562130177515}, 'f1': {'supports': 0.9135802469135802, 'contradicts': 0.6408450704225352, 'parts_of_same': 0.6867469879518073}, 'support': {'supports': 980, 'contradicts': 131, 'parts_of_same': 169}, 'micro_avg': {'precision': 0.85390625, 'recall': 0.85390625, 'f1': 0.85390625, 'support': None}, 'macro_avg': {'precision': 0.7384398568745637, 'recall': 0.7584450501823206, 'f1': 0.7470574350959742, 'support': None}, 'weighted_avg': {'precision': 0.8584765163357513, 'recall': 0.85390625, 'f1': 0.8557184274722781, 'support': None}}
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1878, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0660, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0990, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0818, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9920e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4491e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3586e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 9---------------
Evaluating
				 {'precision': {'supports': 0.9455555555555556, 'contradicts': 0.5393258426966292, 'parts_of_same': 0.6287128712871287}, 'recall': {'supports': 0.8692543411644535, 'contradicts': 0.732824427480916, 'parts_of_same': 0.7470588235294118}, 'f1': {'supports': 0.9058009579563597, 'contradicts': 0.6213592233009709, 'parts_of_same': 0.6827956989247311}, 'support': {'supports': 979, 'contradicts': 131, 'parts_of_same': 170}, 'micro_avg': {'precision': 0.8390625, 'recall': 0.8390625, 'f1': 0.8390625000000002, 'support': None}, 'macro_avg': {'precision': 0.7045314231797711, 'recall': 0.7830458640582605, 'f1': 0.7366519600606872, 'support': None}, 'weighted_avg': {'precision': 0.8618998143757495, 'recall': 0.8390625, 'f1': 0.847072238210084, 'support': None}}
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9989, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0954, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9808, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0873, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0972, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0676, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0777, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0928, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0955, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0784, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8793, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0742, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0944, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1739, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0801, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2824, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1993, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0940, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9815, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1751, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1867, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0931, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0976, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1890, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0758, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4796, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0916, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0808, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1879, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0758, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0951, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1887, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3982, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1954, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0924, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0853, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2916, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0693, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0962, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 10---------------
Evaluating
				 {'precision': {'supports': 0.9071428571428571, 'contradicts': 0.5882352941176471, 'parts_of_same': 0.6938775510204082}, 'recall': {'supports': 0.9080694586312564, 'contradicts': 0.6870229007633588, 'parts_of_same': 0.6}, 'f1': {'supports': 0.9076059213884635, 'contradicts': 0.6338028169014084, 'parts_of_same': 0.6435331230283912}, 'support': {'supports': 979, 'contradicts': 131, 'parts_of_same': 170}, 'micro_avg': {'precision': 0.84453125, 'recall': 0.84453125, 'f1': 0.84453125, 'support': None}, 'macro_avg': {'precision': 0.729751900760304, 'recall': 0.7316974531315384, 'f1': 0.7283139537727544, 'support': None}, 'weighted_avg': {'precision': 0.846180362770108, 'recall': 0.84453125, 'f1': 0.8445117163814194, 'support': None}}
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0687, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0965, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0913, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0794, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1737, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1921, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5925, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2897, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7808, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1908, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0741, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0860, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4752, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0926, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1687, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1954, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4883, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0637, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8906, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0940, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2853, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2733, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3839, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0819, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4857, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2910, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0764, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4930, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2968, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1920, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2771, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0690, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4924, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3934, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0637, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1910, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0638, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0946, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0638, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0848, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0849, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0994, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 11---------------
Evaluating
				 {'precision': {'supports': 0.9277238403451996, 'contradicts': 0.5915492957746479, 'parts_of_same': 0.6255924170616114}, 'recall': {'supports': 0.8784473953013279, 'contradicts': 0.6412213740458015, 'parts_of_same': 0.7764705882352941}, 'f1': {'supports': 0.9024134312696747, 'contradicts': 0.6153846153846154, 'parts_of_same': 0.6929133858267716}, 'support': {'supports': 979, 'contradicts': 131, 'parts_of_same': 170}, 'micro_avg': {'precision': 0.840625, 'recall': 0.840625, 'f1': 0.840625, 'support': None}, 'macro_avg': {'precision': 0.7149551843938197, 'recall': 0.7653797858608078, 'f1': 0.7369038108270206, 'support': None}, 'weighted_avg': {'precision': 0.8531916471444557, 'recall': 0.840625, 'f1': 0.8452136011085527, 'support': None}}
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2914, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0687, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1898, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0737, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0857, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0993, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0947, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2934, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7866, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0897, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0824, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1762, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0981, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1972, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0860, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2833, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0848, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2818, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3996, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9995, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7000, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4992, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3921, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5916, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0789, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 12---------------
Evaluating
				 {'precision': {'supports': 0.9498164014687882, 'contradicts': 0.45662100456621, 'parts_of_same': 0.5368852459016393}, 'recall': {'supports': 0.7926455566905005, 'contradicts': 0.7633587786259542, 'parts_of_same': 0.7705882352941177}, 'f1': {'supports': 0.864142538975501, 'contradicts': 0.5714285714285714, 'parts_of_same': 0.6328502415458938}, 'support': {'supports': 979, 'contradicts': 131, 'parts_of_same': 170}, 'micro_avg': {'precision': 0.78671875, 'recall': 0.78671875, 'f1': 0.7867187499999999, 'support': None}, 'macro_avg': {'precision': 0.6477742173122125, 'recall': 0.7755308568701907, 'f1': 0.6894737839833222, 'support': None}, 'weighted_avg': {'precision': 0.8444985159682782, 'recall': 0.78671875, 'f1': 0.8034665856070002, 'support': None}}
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0951, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0848, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1870, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0949, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5883, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1863, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0904, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4815, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0808, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3914, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6860, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0693, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0988, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2897, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0873, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5933, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0931, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1821, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1716, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0918, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1883, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0881, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0741, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2878, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1736e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 13---------------
Evaluating
				 {'precision': {'supports': 0.9322235434007135, 'contradicts': 0.618421052631579, 'parts_of_same': 0.45993031358885017}, 'recall': {'supports': 0.8, 'contradicts': 0.7230769230769231, 'parts_of_same': 0.7764705882352941}, 'f1': {'supports': 0.8610653487095002, 'contradicts': 0.6666666666666667, 'parts_of_same': 0.5776805251641137}, 'support': {'supports': 980, 'contradicts': 130, 'parts_of_same': 170}, 'micro_avg': {'precision': 0.7890625, 'recall': 0.7890625, 'f1': 0.7890625, 'support': None}, 'macro_avg': {'precision': 0.6701916365403809, 'recall': 0.7665158371040723, 'f1': 0.7018041801800935, 'support': None}, 'weighted_avg': {'precision': 0.8376265333475852, 'recall': 0.7890625, 'f1': 0.8036846856874034, 'support': None}}
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0863, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0687, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2933, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0846, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3940, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2784, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0979, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0952, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3930, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0968, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0999, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3716, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0815, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8986, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0878, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3840, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3904, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0979, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0972, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0897, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2982, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1819, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0800, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3930, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0889, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 14---------------
Evaluating
				 {'precision': {'supports': 0.9044265593561368, 'contradicts': 0.6304347826086957, 'parts_of_same': 0.7162162162162162}, 'recall': {'supports': 0.9182839632277835, 'contradicts': 0.6641221374045801, 'parts_of_same': 0.6235294117647059}, 'f1': {'supports': 0.9113025848960973, 'contradicts': 0.6468401486988848, 'parts_of_same': 0.6666666666666666}, 'support': {'supports': 979, 'contradicts': 131, 'parts_of_same': 170}, 'micro_avg': {'precision': 0.853125, 'recall': 0.853125, 'f1': 0.853125, 'support': None}, 'macro_avg': {'precision': 0.7503591860603495, 'recall': 0.7353118374656898, 'f1': 0.7416031334205496, 'support': None}, 'weighted_avg': {'precision': 0.8513885272563702, 'recall': 0.853125, 'f1': 0.8517457995516926, 'support': None}}
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5787, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0888, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0982, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6875, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2935, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1959, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0767, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0771, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4817, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0637, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0720, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0908, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0819, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8821, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0957, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0908, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0762, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0925, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1979, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0993, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1762, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2942, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1912, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1733, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0938, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1916, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3999, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0990, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 15---------------
Evaluating
				 {'precision': {'supports': 0.9128672745694022, 'contradicts': 0.6363636363636364, 'parts_of_same': 0.686046511627907}, 'recall': {'supports': 0.9203268641470889, 'contradicts': 0.5877862595419847, 'parts_of_same': 0.6941176470588235}, 'f1': {'supports': 0.9165818921668363, 'contradicts': 0.6111111111111112, 'parts_of_same': 0.6900584795321637}, 'support': {'supports': 979, 'contradicts': 131, 'parts_of_same': 170}, 'micro_avg': {'precision': 0.85625, 'recall': 0.85625, 'f1': 0.85625, 'support': None}, 'macro_avg': {'precision': 0.7450924741869818, 'recall': 0.7340769235826322, 'f1': 0.7392504942700371, 'support': None}, 'weighted_avg': {'precision': 0.8544442227686135, 'recall': 0.85625, 'f1': 0.855233726177622, 'support': None}}
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4310e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0637, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1762, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0993, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5806, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0928, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0801, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0982, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0784, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3586e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0994, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1660, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5772, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0638, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6793, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0873, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0739, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1764, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0926, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 16---------------
Evaluating
				 {'precision': {'supports': 0.9438202247191011, 'contradicts': 0.5695364238410596, 'parts_of_same': 0.5815899581589958}, 'recall': {'supports': 0.8571428571428571, 'contradicts': 0.6615384615384615, 'parts_of_same': 0.8176470588235294}, 'f1': {'supports': 0.8983957219251337, 'contradicts': 0.6120996441281139, 'parts_of_same': 0.6797066014669927}, 'support': {'supports': 980, 'contradicts': 130, 'parts_of_same': 170}, 'micro_avg': {'precision': 0.83203125, 'recall': 0.83203125, 'f1': 0.83203125, 'support': None}, 'macro_avg': {'precision': 0.6983155355730521, 'recall': 0.7787761258349493, 'f1': 0.7300673225067468, 'support': None}, 'weighted_avg': {'precision': 0.8576983189149111, 'recall': 0.83203125, 'f1': 0.840274127713027, 'support': None}}
Loss: tensor(1.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2909, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1885, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2784, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7951, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3976, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0767, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0830, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0720, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1940, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0840, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1947, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2938, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0808, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2919, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0767, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 17---------------
Evaluating
				 {'precision': {'supports': 0.9222343921139102, 'contradicts': 0.6176470588235294, 'parts_of_same': 0.5584415584415584}, 'recall': {'supports': 0.8600612870275791, 'contradicts': 0.6412213740458015, 'parts_of_same': 0.7588235294117647}, 'f1': {'supports': 0.8900634249471459, 'contradicts': 0.6292134831460674, 'parts_of_same': 0.6433915211970074}, 'support': {'supports': 979, 'contradicts': 131, 'parts_of_same': 170}, 'micro_avg': {'precision': 0.82421875, 'recall': 0.82421875, 'f1': 0.82421875, 'support': None}, 'macro_avg': {'precision': 0.6994410031263327, 'recall': 0.7533687301617151, 'f1': 0.7208894764300734, 'support': None}, 'weighted_avg': {'precision': 0.8427455465003636, 'recall': 0.82421875, 'f1': 0.8306059514991265, 'support': None}}
Loss: tensor(0.5816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1801, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1900, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1862, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0961, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2913, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0944, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0968, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3673e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9920e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3806, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1815, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0145e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5982e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5857, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1690, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0857, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4764, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0955, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3830, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0720, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 18---------------
Evaluating
				 {'precision': {'supports': 0.9427942794279428, 'contradicts': 0.5642458100558659, 'parts_of_same': 0.671875}, 'recall': {'supports': 0.8753830439223698, 'contradicts': 0.7709923664122137, 'parts_of_same': 0.7588235294117647}, 'f1': {'supports': 0.9078389830508474, 'contradicts': 0.6516129032258065, 'parts_of_same': 0.712707182320442}, 'support': {'supports': 979, 'contradicts': 131, 'parts_of_same': 170}, 'micro_avg': {'precision': 0.84921875, 'recall': 0.84921875, 'f1': 0.84921875, 'support': None}, 'macro_avg': {'precision': 0.7263050298279362, 'recall': 0.8017329799154495, 'f1': 0.7573863561990319, 'support': None}, 'weighted_avg': {'precision': 0.8680707427166207, 'recall': 0.84921875, 'f1': 0.8556999029092465, 'support': None}}
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1050e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2768e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8472e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2949e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2949e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0986, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4216e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4534e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3979, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5483e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1863e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3311e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8878e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3586e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2768e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8487e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 19---------------
Evaluating
				 {'precision': {'supports': 0.9166666666666666, 'contradicts': 0.6417910447761194, 'parts_of_same': 0.6954022988505747}, 'recall': {'supports': 0.9101123595505618, 'contradicts': 0.6564885496183206, 'parts_of_same': 0.711764705882353}, 'f1': {'supports': 0.9133777549974371, 'contradicts': 0.649056603773585, 'parts_of_same': 0.7034883720930233}, 'support': {'supports': 979, 'contradicts': 131, 'parts_of_same': 170}, 'micro_avg': {'precision': 0.8578125, 'recall': 0.8578125, 'f1': 0.8578125, 'support': None}, 'macro_avg': {'precision': 0.7512866700977869, 'recall': 0.7594552050170784, 'f1': 0.7553075769546819, 'support': None}, 'weighted_avg': {'precision': 0.8591481908882311, 'recall': 0.8578125, 'f1': 0.8584502035098787, 'support': None}}
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4129e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6706e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1320e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3586e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8653e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0688e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3492e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1863e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0507e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6525e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9735e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5439e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3405e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0821e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8410e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2768e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2891e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2949e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3403e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3946e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4491e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6706e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8207e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5258e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6655e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4127e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5328e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5050e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0012e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 20---------------
Evaluating
				 {'precision': {'supports': 0.91353001017294, 'contradicts': 0.6461538461538462, 'parts_of_same': 0.7125748502994012}, 'recall': {'supports': 0.9172625127681308, 'contradicts': 0.6412213740458015, 'parts_of_same': 0.7}, 'f1': {'supports': 0.9153924566768604, 'contradicts': 0.6436781609195402, 'parts_of_same': 0.7062314540059347}, 'support': {'supports': 979, 'contradicts': 131, 'parts_of_same': 170}, 'micro_avg': {'precision': 0.86015625, 'recall': 0.86015625, 'f1': 0.86015625, 'support': None}, 'macro_avg': {'precision': 0.7574195688753957, 'recall': 0.7528279622713109, 'f1': 0.7551006905341118, 'support': None}, 'weighted_avg': {'precision': 0.8594763737159065, 'recall': 0.86015625, 'f1': 0.8598050010532148, 'support': None}}
Loss: tensor(1.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1593e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6525e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4491e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8975e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3512e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4896e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2044e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8154e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4851e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8878e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6399e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7410e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9624e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2498e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6951e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2167e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9735e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6931e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9805e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8719e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9505e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7313e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6308e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9554e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8697e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4759e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1774e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2949e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9602e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1112e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7266e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5006e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5255e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3478e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5302e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8763e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9916e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1353e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4129e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9408e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2587e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7304e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3668e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2935e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 21---------------
Evaluating
				 {'precision': {'supports': 0.9134419551934827, 'contradicts': 0.6439393939393939, 'parts_of_same': 0.7108433734939759}, 'recall': {'supports': 0.916241062308478, 'contradicts': 0.648854961832061, 'parts_of_same': 0.6941176470588235}, 'f1': {'supports': 0.9148393676695563, 'contradicts': 0.6463878326996197, 'parts_of_same': 0.7023809523809523}, 'support': {'supports': 979, 'contradicts': 131, 'parts_of_same': 170}, 'micro_avg': {'precision': 0.859375, 'recall': 0.859375, 'f1': 0.859375, 'support': None}, 'macro_avg': {'precision': 0.7560749075422842, 'recall': 0.7530712237331209, 'f1': 0.7545360509167095, 'support': None}, 'weighted_avg': {'precision': 0.8589524283081689, 'recall': 0.859375, 'f1': 0.8591478976069592, 'support': None}}
Loss: tensor(7.1328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7902e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4172e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0372e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8472e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0372e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4353e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2039e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5121e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9059e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6957e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7257e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9059e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2258e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5026e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8895e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3514e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3781e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2225e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2498e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5019e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9895e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4779e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8304e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4302e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3918e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7278e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6022e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9554e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1293e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5077e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4657e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0640e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0688e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4035e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2112e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7004e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5549e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5302e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2355e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1059e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3116e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0242e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7112e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9812e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5174e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4854e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3854e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3412e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3767e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4507e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9375e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4896e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6408e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0847e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8017e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9735e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0640e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7849e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6686e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8352e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2313e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3492e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9916e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3130e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1896e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4863e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1587e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9324e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7973e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5664e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8653e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3714e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9346e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9169e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0503e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3854e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3044e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7767e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3275e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0851e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2258e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8405e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6022e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3772e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9554e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3953e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4035e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1085e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0423e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0589e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9737e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8211e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5569e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4123e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9503e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0772e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 22---------------
Evaluating
				 {'precision': {'supports': 0.9126016260162602, 'contradicts': 0.6439393939393939, 'parts_of_same': 0.7195121951219512}, 'recall': {'supports': 0.9172625127681308, 'contradicts': 0.648854961832061, 'parts_of_same': 0.6941176470588235}, 'f1': {'supports': 0.91492613346918, 'contradicts': 0.6463878326996197, 'parts_of_same': 0.7065868263473054}, 'support': {'supports': 979, 'contradicts': 131, 'parts_of_same': 170}, 'micro_avg': {'precision': 0.86015625, 'recall': 0.86015625, 'f1': 0.86015625, 'support': None}, 'macro_avg': {'precision': 0.7586844050258685, 'recall': 0.7534117072196717, 'f1': 0.7559669308387017, 'support': None}, 'weighted_avg': {'precision': 0.8594610356614929, 'recall': 0.86015625, 'f1': 0.8597728525226712, 'support': None}}
Loss: tensor(1.9805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2586e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6180e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2044e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0357e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1293e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9631e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6533e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3673e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4295e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3999e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5920e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2768e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6037e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0242e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7547e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6461e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7708e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3218e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3818e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8801e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4136e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8816e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7728e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6022e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7768e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0048e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5297e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4260e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0951e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6803e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8807e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9112e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9920e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7666e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2695e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3752e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6379e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3134e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4397e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2136e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9783e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6121e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2467e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1474e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1138e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3035e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5805e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2044e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6355e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6916e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9746e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4129e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7845e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0604e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0741e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9554e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7123e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8405e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6730e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5997e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0491e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6750e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4357e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6167e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0657e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7430e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6410e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9699e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1320e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5812e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0821e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1320e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5761e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4578e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3079e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2498e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7129e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0372e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2882e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1880e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6203e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1156e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4273e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2957e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6838e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3443e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6401e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1655e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0233e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0379e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2257e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2324e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2229e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9759e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7478e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4302e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5483e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2598e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3198e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2406e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0858e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1863e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0108e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5496e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7812e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6163e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3041e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8258e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8913e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1059e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1403e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9313e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2198e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8997e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8405e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1425e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7547e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4754e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5505e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0286e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8759e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6211e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4900e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4286e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9587e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6706e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4317e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9953e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4551e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8368e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0355e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1368e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5178e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2536e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6405e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3017e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8860e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7569e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0706e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5664e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1680e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 23---------------
Evaluating
				 {'precision': {'supports': 0.9153924566768603, 'contradicts': 0.6444444444444445, 'parts_of_same': 0.7195121951219512}, 'recall': {'supports': 0.9163265306122449, 'contradicts': 0.6692307692307692, 'parts_of_same': 0.6941176470588235}, 'f1': {'supports': 0.915859255481897, 'contradicts': 0.6566037735849056, 'parts_of_same': 0.7065868263473054}, 'support': {'supports': 980, 'contradicts': 130, 'parts_of_same': 170}, 'micro_avg': {'precision': 0.86171875, 'recall': 0.86171875, 'f1': 0.86171875, 'support': None}, 'macro_avg': {'precision': 0.7597830320810853, 'recall': 0.7598916489672792, 'f1': 0.7596832851380361, 'support': None}, 'weighted_avg': {'precision': 0.8618589519467443, 'recall': 0.86171875, 'f1': 0.8617346261072958, 'support': None}}
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8688e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1041e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3593e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5436e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8260e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2895e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0944e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0055e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6770e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7169e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7664e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8955e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5955e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8077e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9450e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9681e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1403e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6361e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7681e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3472e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3637e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5132e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9284e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6602e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8518e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4213e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4529e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7633e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3759e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4017e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4129e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2218e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9229e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5474e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8310e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4156e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9531e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6392e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8143e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7540e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3304e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1863e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3059e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7297e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6904e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2684e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4143e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8785e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3441e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6900e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4990e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1006e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1781e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2761e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1690e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3046e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7774e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9825e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4569e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2273e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9302e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8216e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2990e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8860e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7730e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8900e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9783e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0723e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1266e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5348e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1114e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0085e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0459e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3222e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7534e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8847e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0342e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7783e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5801e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4408e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8657e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5302e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7655e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3728e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1688e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8461e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3593e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2545e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7688e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5953e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2461e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9898e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2289e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2554e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5858e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3767e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2741e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9527e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0101e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7348e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7070e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4397e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9693e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1044e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3719e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5094e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4805e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6022e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4443e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5531e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7809e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1730e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9953e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8198e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1677e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4114e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5801e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4982e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0498e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0236e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4589e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4308e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0944e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5203e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9772e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7990e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5077e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1540e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2587e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1350e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0459e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5982e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6022e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2225e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0134e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5995e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0055e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9686e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4353e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6803e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6944e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3224e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2339e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4990e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2092e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7547e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8233e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7066e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9209e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6838e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5088e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5434e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4445e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3130e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4845e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0547e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0070e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6467e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8092e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0224e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3893e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4180e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1379e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0770e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5121e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6805e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7282e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8425e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5675e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5849e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7441e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4465e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6966e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3085e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6304e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2039e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8311e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2099e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8854e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1176e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4600e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0920e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5644e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2310e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6582e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3900e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3446e-06, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 24---------------
Evaluating
				 {'precision': {'supports': 0.9134419551934827, 'contradicts': 0.6466165413533834, 'parts_of_same': 0.7151515151515152}, 'recall': {'supports': 0.916241062308478, 'contradicts': 0.6564885496183206, 'parts_of_same': 0.6941176470588235}, 'f1': {'supports': 0.9148393676695563, 'contradicts': 0.6515151515151516, 'parts_of_same': 0.7044776119402986}, 'support': {'supports': 979, 'contradicts': 131, 'parts_of_same': 170}, 'micro_avg': {'precision': 0.86015625, 'recall': 0.86015625, 'f1': 0.86015625, 'support': None}, 'macro_avg': {'precision': 0.7584033372327937, 'recall': 0.7556157529952073, 'f1': 0.7569440437083355, 'support': None}, 'weighted_avg': {'precision': 0.8597985926777112, 'recall': 0.86015625, 'f1': 0.8599511092397119, 'support': None}}
Loss: tensor(6.4639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2423e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9746e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8854e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4664e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6233e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9048e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2779e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2092e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9172e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8520e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2452e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2527e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3871e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5556e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6022e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8302e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1863e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2352e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7366e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8231e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3633e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9116e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9554e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3434e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3949e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6807e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6794e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2092e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2916e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6666e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7927e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8198e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8686e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3260e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8008e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9066e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9368e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0589e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4163e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1013e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9761e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0997e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2655e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1761e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0030e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8664e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0714e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4825e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9443e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7871e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1220e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5697e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4701e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3257e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6319e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4580e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3213e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0644e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7715e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3200e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2406e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9821e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6220e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2286e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7350e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2339e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3653e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3847e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0171e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9916e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9384e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9730e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2112e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0370e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5213e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5425e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4370e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7955e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2648e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0315e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5516e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4284e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7580e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2099e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9388e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2178e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4136e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1282e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9297e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4180e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5436e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0688e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9580e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9238e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7079e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0801e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0783e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3346e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3134e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7675e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5408e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1500e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3260e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4059e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6957e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2079e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0598e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7624e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1366e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6074e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6688e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6783e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3320e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5812e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9229e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2792e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7849e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6525e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3794e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4990e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0236e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9425e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9169e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2973e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3565e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9871e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4039e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0496e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6242e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4227e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0809e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0008e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6558e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1664e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8604e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7746e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7355e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0935e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2920e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2346e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0913e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8061e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0688e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4037e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1809e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6022e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6957e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3441e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9962e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3257e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8693e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0767e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6046e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8673e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9554e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9571e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3622e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7066e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6845e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4604e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8370e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9556e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6127e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4092e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3425e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3821e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6074e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9167e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0851e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2379e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2540e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3774e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7319e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1331e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3628e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1809e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3485e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4209e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4931e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1984e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8962e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3686e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6509e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9728e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1721e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5077e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8878e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2768e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2721e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5516e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4794e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2598e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0483e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0807e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2953e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6670e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6077e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0794e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2273e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3911e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9977e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8379e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5765e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7858e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5973e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7668e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4308e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5244e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7213e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6898e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2600e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8061e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5862e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8050e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8282e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2229e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6776e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5275e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4417e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7483e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8154e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7924e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8997e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4648e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2997e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 25---------------
Evaluating
				 {'precision': {'supports': 0.9134419551934827, 'contradicts': 0.6466165413533834, 'parts_of_same': 0.7151515151515152}, 'recall': {'supports': 0.916241062308478, 'contradicts': 0.6564885496183206, 'parts_of_same': 0.6941176470588235}, 'f1': {'supports': 0.9148393676695563, 'contradicts': 0.6515151515151516, 'parts_of_same': 0.7044776119402986}, 'support': {'supports': 979, 'contradicts': 131, 'parts_of_same': 170}, 'micro_avg': {'precision': 0.86015625, 'recall': 0.86015625, 'f1': 0.86015625, 'support': None}, 'macro_avg': {'precision': 0.7584033372327937, 'recall': 0.7556157529952073, 'f1': 0.7569440437083355, 'support': None}, 'weighted_avg': {'precision': 0.8597985926777112, 'recall': 0.86015625, 'f1': 0.8599511092397119, 'support': None}}
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5900e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1112e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6227e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6476e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6006e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3112e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5366e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7690e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0969e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9216e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8693e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9255e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0909e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6059e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6984e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1297e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4432e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7500e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0052e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1443e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8331e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2516e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9304e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6264e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1278e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5949e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8017e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5262e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3346e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0832e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2962e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5394e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1039e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8988e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5483e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3368e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5600e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0008e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7200e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2695e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5348e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6916e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7562e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8050e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4251e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4534e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3412e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2339e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1907e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2224e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2540e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0982e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9284e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2244e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8644e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3381e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0185e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4101e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0783e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0242e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5103e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9008e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7708e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7313e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7737e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4651e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2973e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8708e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7145e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0079e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6642e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8973e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9578e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3244e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0094e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3697e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0651e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8512e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3366e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3379e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7350e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2520e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9216e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4624e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6046e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2595e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9372e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6895e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0156e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1328e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0074e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5406e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4966e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9693e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3796e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9624e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5315e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9783e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7715e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6284e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1655e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8092e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1112e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0489e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7432e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2114e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6832e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7103e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4533e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2178e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0370e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2889e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9531e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5697e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5472e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9055e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7962e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3628e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3578e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8293e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3050e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1863e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7675e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2803e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8379e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1931e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3862e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6591e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7350e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8708e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7271e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5785e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4589e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1646e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3178e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1525e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7260e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4397e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5949e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4238e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5169e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5191e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8308e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7375e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2666e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6465e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0108e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6794e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1809e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1984e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2233e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9761e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2121e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8653e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1147e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4492e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0470e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9251e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2988e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8847e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7924e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1794e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1447e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5403e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1818e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3746e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5785e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2233e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9203e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6953e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5699e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3063e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8512e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7949e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6944e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3927e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2598e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2920e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5880e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1593e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2768e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1909e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6545e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0735e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6942e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7675e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2227e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6922e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6249e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8436e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6509e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5357e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5589e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0167e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3236e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8297e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5439e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0637e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2520e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4624e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1147e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4017e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9044e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5865e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6770e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7044e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4412e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2225e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3010e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7781e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0074e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4452e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8693e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3977e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3035e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6750e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6249e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5752e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7375e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4180e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4673e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8167e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0492e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6295e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4565e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1580e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7869e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3019e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9453e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 26---------------
Evaluating
				 {'precision': {'supports': 0.9143730886850153, 'contradicts': 0.6492537313432836, 'parts_of_same': 0.7151515151515152}, 'recall': {'supports': 0.916241062308478, 'contradicts': 0.6641221374045801, 'parts_of_same': 0.6941176470588235}, 'f1': {'supports': 0.9153061224489795, 'contradicts': 0.6566037735849057, 'parts_of_same': 0.7044776119402986}, 'support': {'supports': 979, 'contradicts': 131, 'parts_of_same': 170}, 'micro_avg': {'precision': 0.8609375, 'recall': 0.8609375, 'f1': 0.8609375, 'support': None}, 'macro_avg': {'precision': 0.7595927783932713, 'recall': 0.7581602822572938, 'f1': 0.7587958359913946, 'support': None}, 'weighted_avg': {'precision': 0.8607806642221544, 'recall': 0.8609375, 'f1': 0.8608288923804878, 'support': None}}
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1977e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4180e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5516e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1781e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4801e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9551e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5878e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2454e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6723e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0470e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9048e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0423e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6807e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7200e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1085e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3257e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5491e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0198e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6352e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3858e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1984e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9531e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7949e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7688e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0520e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5200e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3746e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7496e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5856e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5653e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7260e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0767e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4430e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6346e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9116e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7628e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2554e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4430e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2693e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8898e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5242e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3039e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1580e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5895e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4059e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5328e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6770e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9390e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0227e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9370e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3041e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1863e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5593e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2019e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7229e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6361e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4417e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3922e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2339e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2862e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3266e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4953e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2483e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0514e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3664e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2869e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7754e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9198e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8646e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0211e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7269e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2505e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2869e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5390e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7969e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5346e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5147e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2339e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2540e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6022e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1772e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0677e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6670e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4439e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5470e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0876e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2044e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1955e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4308e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0242e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7969e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3673e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4154e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7500e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3353e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2432e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0966e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1092e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1984e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9690e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1388e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5684e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6951e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6527e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1962e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6108e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0730e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6988e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6889e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2701e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6039e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8805e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2701e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9774e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4405e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6589e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6723e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9509e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0598e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0061e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3628e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4913e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1375e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2079e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2043e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9847e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2708e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4635e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7447e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5646e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5103e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5562e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8966e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6904e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9189e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6032e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7154e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4589e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4158e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5503e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6719e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2439e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5218e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1447e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3902e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6251e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0951e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8352e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5141e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8264e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9222e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2973e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4141e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9178e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0061e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7746e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2792e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1509e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9913e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4112e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3055e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6946e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9264e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3500e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0651e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0651e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8955e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6565e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8565e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3366e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5244e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9203e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1997e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6825e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1035e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5315e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0957e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4269e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9147e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0156e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0233e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2922e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7225e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2368e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3869e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9951e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9913e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9880e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4995e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2664e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6509e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4942e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0278e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5785e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4801e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6421e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6746e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7167e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5282e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5397e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6851e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0966e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2158e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5721e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4035e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0714e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2540e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0255e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5209e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1600e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9644e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6286e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3194e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8105e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6602e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6185e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7425e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8714e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6161e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4339e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2112e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6384e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9375e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3251e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6320e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7068e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7935e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6227e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7935e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8827e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5860e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5209e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4918e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8171e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7770e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2006e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1909e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7085e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8059e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9419e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8580e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5161e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4960e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4046e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4960e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1907e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4699e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4123e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0379e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0891e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5900e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4927e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6895e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8037e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5006e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1282e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8863e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4946e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9350e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7825e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8827e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7668e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2860e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1434e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7675e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9984e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3816e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5461e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7600e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9189e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7677e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2776e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0233e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2973e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0423e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2406e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3726e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7924e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1070e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4686e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8854e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2074e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5041e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 27---------------
Evaluating
				 {'precision': {'supports': 0.9143730886850153, 'contradicts': 0.6492537313432836, 'parts_of_same': 0.7151515151515152}, 'recall': {'supports': 0.916241062308478, 'contradicts': 0.6641221374045801, 'parts_of_same': 0.6941176470588235}, 'f1': {'supports': 0.9153061224489795, 'contradicts': 0.6566037735849057, 'parts_of_same': 0.7044776119402986}, 'support': {'supports': 979, 'contradicts': 131, 'parts_of_same': 170}, 'micro_avg': {'precision': 0.8609375, 'recall': 0.8609375, 'f1': 0.8609375, 'support': None}, 'macro_avg': {'precision': 0.7595927783932713, 'recall': 0.7581602822572938, 'f1': 0.7587958359913946, 'support': None}, 'weighted_avg': {'precision': 0.8607806642221544, 'recall': 0.8609375, 'f1': 0.8608288923804878, 'support': None}}
Loss: tensor(2.2368e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3322e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6278e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8704e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4430e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9203e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3253e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6953e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8077e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2114e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2595e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1615e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6931e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8503e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0505e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9860e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5571e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5310e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9849e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7540e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3172e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2405e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2768e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0785e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4224e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7041e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3997e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6772e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4216e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4927e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6918e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6180e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1375e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5308e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7587e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1253e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7372e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2101e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9768e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3322e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3172e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6313e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3931e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7474e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5640e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7191e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2726e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4203e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9533e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9587e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9743e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5805e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4043e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8489e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8701e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8895e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3673e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7761e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3163e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7253e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9372e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8061e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3997e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4895e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3238e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4141e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3951e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9556e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8077e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5242e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6951e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9880e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7809e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8108e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6723e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3706e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9509e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2730e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6361e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7911e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7209e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8602e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8807e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4043e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8198e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1138e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8037e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4269e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9008e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5390e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0412e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4721e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1531e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8849e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5909e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1503e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9893e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2295e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4412e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5353e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9198e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4646e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0701e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4946e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6909e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5516e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7085e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7447e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2554e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5999e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4858e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7628e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2233e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1147e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0966e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3319e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2514e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7470e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6527e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3447e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8304e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0876e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8158e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1624e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5046e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4282e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9397e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9589e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6770e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5999e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6904e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9257e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4043e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1050e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1863e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2152e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0271e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4737e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0741e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1686e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9145e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6529e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2324e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8673e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9308e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9141e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6366e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4024e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9754e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7900e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7858e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5642e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8761e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9668e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7132e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9536e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5375e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8339e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8059e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8465e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9008e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4324e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5990e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4236e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1434e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4765e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4626e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4218e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8593e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8761e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1984e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7044e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8670e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6904e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0556e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2876e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8895e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3896e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1997e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4693e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1333e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0242e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2233e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6847e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2595e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0512e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7768e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7851e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1328e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5127e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7525e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3688e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2233e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2823e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3353e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4542e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0818e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1918e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3445e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6763e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3271e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6670e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8774e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4746e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1145e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8105e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9953e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0085e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3714e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7112e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6783e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0785e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8311e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6315e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3238e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1551e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8955e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6022e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6602e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9399e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2542e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9721e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1331e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7995e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6807e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4302e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8635e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1397e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9017e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9194e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8443e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9044e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1384e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8646e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8412e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9849e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8854e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1816e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5704e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7154e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0637e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9551e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8816e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6542e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1997e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3375e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5527e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9189e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8465e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7388e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6904e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0637e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0130e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3887e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7668e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7990e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7072e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2333e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5412e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3962e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2222e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8827e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5447e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1551e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0242e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9178e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5571e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5871e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4498e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5779e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2827e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2295e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8655e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8878e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6542e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5626e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2695e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9454e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5489e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8863e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4699e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5088e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5289e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1079e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3545e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5946e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6176e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4794e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7946e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7856e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8512e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3388e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7582e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9022e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6693e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8302e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5322e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3070e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8955e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8602e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1505e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5141e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2474e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7935e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7688e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7878e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3238e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1759e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8249e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4317e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1635e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9880e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6602e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5706e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7381e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1984e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6180e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5361e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9008e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0108e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4043e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6728e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0436e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1953e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8593e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7878e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0655e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7172e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4792e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9010e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9236e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7741e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4324e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6361e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6432e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9022e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8004e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4792e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6525e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 28---------------
Evaluating
				 {'precision': {'supports': 0.9152196118488254, 'contradicts': 0.6444444444444445, 'parts_of_same': 0.7168674698795181}, 'recall': {'supports': 0.9152196118488254, 'contradicts': 0.6641221374045801, 'parts_of_same': 0.7}, 'f1': {'supports': 0.9152196118488254, 'contradicts': 0.6541353383458647, 'parts_of_same': 0.7083333333333334}, 'support': {'supports': 979, 'contradicts': 131, 'parts_of_same': 170}, 'micro_avg': {'precision': 0.8609375, 'recall': 0.8609375, 'f1': 0.8609375, 'support': None}, 'macro_avg': {'precision': 0.7588438420575959, 'recall': 0.7597805830844685, 'f1': 0.7592294278426746, 'support': None}, 'weighted_avg': {'precision': 0.8611638219544846, 'recall': 0.8609375, 'f1': 0.8610221843671679, 'support': None}}
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5161e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3600e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9741e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7582e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7759e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4540e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3368e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3057e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3913e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6061e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0028e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5308e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9723e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3412e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9008e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1476e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0721e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8997e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1686e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8445e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8697e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4529e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0922e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9950e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4779e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2346e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0094e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3125e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1022e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7935e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3882e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5770e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2152e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5489e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6633e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4348e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1260e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6262e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9189e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2101e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1940e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6057e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1863e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4534e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7388e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9768e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7313e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7282e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7085e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2222e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6022e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8805e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0130e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1759e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3549e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0637e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4715e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5489e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7266e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5198e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4483e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2108e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9902e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0737e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4805e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9406e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4688e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6854e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7406e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0604e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6329e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9895e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5459e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9030e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3862e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1143e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9759e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2754e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6589e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5220e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2821e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0626e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5571e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7200e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8995e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0512e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7041e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9927e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6070e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5949e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9779e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5127e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5231e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5322e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7273e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8529e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8487e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1816e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8384e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0737e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3070e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4505e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0447e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8693e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1116e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4927e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6723e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9472e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4143e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3996e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2483e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0673e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1129e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9055e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1690e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2527e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0242e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2701e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2527e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8465e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0774e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0257e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7216e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2289e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1461e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0209e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1622e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5527e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1099e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7809e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8827e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3726e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5562e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0520e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9238e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8013e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0459e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0626e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4540e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4430e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8171e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0304e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6863e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4540e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7401e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1534e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1143e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1686e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7809e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9211e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2962e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4505e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6728e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0741e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4492e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4779e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4818e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4375e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0898e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2911e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8765e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0673e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6505e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7922e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8465e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1127e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6066e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9041e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6723e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1147e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8465e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7238e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5127e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8885e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4136e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5704e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1099e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6657e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8171e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1927e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7578e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9754e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4573e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2695e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2695e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2414e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7397e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7447e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2339e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0050e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5127e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7470e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5050e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6134e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9032e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3668e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7990e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0512e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9008e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4973e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9370e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1147e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9427e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7990e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9759e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4598e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6180e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4489e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7578e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6723e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7944e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1350e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9008e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9569e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8863e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5946e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1295e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5774e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7922e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2302e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5770e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2730e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5951e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2152e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2483e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5529e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4134e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7946e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8951e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2333e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7969e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3796e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1216e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1695e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1569e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6348e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9319e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4077e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8046e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6134e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8763e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6022e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5772e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9000e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4946e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6136e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4946e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2368e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8304e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8026e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2158e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4598e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6542e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3670e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3487e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7039e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7039e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5478e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2911e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1441e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5308e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3443e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7573e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5774e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0827e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2957e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2152e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2735e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4946e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1348e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3953e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7039e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8492e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7225e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3712e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6542e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6854e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1686e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6200e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9425e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1227e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1260e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1571e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4880e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8284e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8465e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3774e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9624e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9030e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4043e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1803e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3896e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2507e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4754e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5743e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7759e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8827e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3570e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8465e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9666e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3688e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8891e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7651e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7271e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2882e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6854e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8646e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3593e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0809e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9858e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5489e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0112e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9931e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0368e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7381e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9050e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6180e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3673e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8218e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5414e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0483e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6677e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7628e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8628e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4534e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7211e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9406e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9189e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4598e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6055e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2209e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6180e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4699e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4465e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4591e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9178e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1147e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0289e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5423e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8154e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5512e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4518e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0693e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2483e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1551e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5772e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8213e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2145e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9262e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4176e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1565e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7190e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1066e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8988e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6723e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6339e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0737e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8662e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5116e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4946e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2368e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5041e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7878e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7447e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9885e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8284e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0626e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 29---------------
Evaluating
				 {'precision': {'supports': 0.9153061224489796, 'contradicts': 0.6417910447761194, 'parts_of_same': 0.7168674698795181}, 'recall': {'supports': 0.9153061224489796, 'contradicts': 0.6615384615384615, 'parts_of_same': 0.7}, 'f1': {'supports': 0.9153061224489796, 'contradicts': 0.6515151515151515, 'parts_of_same': 0.7083333333333334}, 'support': {'supports': 980, 'contradicts': 130, 'parts_of_same': 170}, 'micro_avg': {'precision': 0.8609375, 'recall': 0.8609375, 'f1': 0.8609375, 'support': None}, 'macro_avg': {'precision': 0.7579882123682057, 'recall': 0.7589481946624804, 'f1': 0.7583848690991548, 'support': None}, 'weighted_avg': {'precision': 0.8611721138284482, 'recall': 0.8609375, 'f1': 0.861026278409091, 'support': None}}
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2944e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1167e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4375e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2549e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8988e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8770e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6794e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6417e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2447e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4507e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9754e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3379e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3125e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2935e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5127e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1565e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8904e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3041e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8050e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0512e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3781e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7759e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3487e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4858e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9017e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3545e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3809e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9461e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5953e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6180e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8304e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0262e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9977e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1461e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7224e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9350e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7322e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1203e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7260e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1152e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8701e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0962e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5772e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0598e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3419e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0558e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3368e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7767e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5957e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6582e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5022e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6068e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5772e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0909e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1328e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0960e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1485e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4028e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2006e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1677e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6026e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6474e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2514e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3419e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3035e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6951e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7922e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5489e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1331e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0242e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2746e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1384e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1529e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0529e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1328e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2167e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5041e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9754e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5772e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5591e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0626e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7273e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6368e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7922e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2664e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7043e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0990e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6668e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2709e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8454e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9699e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6496e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3253e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6361e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6361e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2916e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9421e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1147e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5816e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4308e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7768e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6145e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4244e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9885e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2514e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8662e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0392e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6723e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2520e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0737e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7044e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1825e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2514e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6180e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3984e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1803e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9198e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1099e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9913e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1768e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1918e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8827e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1569e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6180e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3889e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2507e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2266e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3070e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4536e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2333e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8662e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0257e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1099e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1712e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5196e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3668e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7701e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0863e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9704e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4858e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1008e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6852e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1143e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7628e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4244e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9406e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1008e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1997e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0854e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5127e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5644e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5176e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0061e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3278e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5229e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4889e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7922e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0807e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6055e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5041e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9856e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6852e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8662e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4765e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6779e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6412e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1664e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7990e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1116e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1984e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3172e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2414e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2269e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5134e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6200e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9924e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1891e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8454e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3849e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0447e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2695e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5999e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5776e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7266e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6852e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8171e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3158e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2876e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7342e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4882e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6134e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9551e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6746e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2152e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4708e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1099e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3339e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9582e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8445e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6408e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8635e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4779e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7708e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7039e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6271e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7944e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0598e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1079e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9472e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1984e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3849e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8139e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2554e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1022e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3251e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1940e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7333e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3231e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1876e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4099e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5297e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4366e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5807e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3527e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8849e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7776e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3975e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9746e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8132e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1044e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8807e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2695e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6858e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5489e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7615e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0443e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7496e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9030e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0624e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2465e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1260e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2796e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8533e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2216e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2709e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3478e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0284e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5807e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0918e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2916e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6138e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3419e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1348e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6852e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7236e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2754e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0556e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7085e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6229e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1458e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0918e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4573e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2889e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8445e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1622e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3984e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4935e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0761e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4421e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1441e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1161e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1282e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2916e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7211e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5342e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7562e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4547e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0242e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2735e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2582e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4278e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0262e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5370e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7108e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2977e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3421e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2492e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2346e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3847e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2554e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1858e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7743e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2152e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8666e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3816e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9715e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4944e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1134e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4507e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2348e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4946e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3803e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0904e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1143e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4311e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6657e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6852e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7529e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0918e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5380e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7039e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7935e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6904e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3628e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9969e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5061e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3849e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9339e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4392e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3578e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3908e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9746e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1851e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3975e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1044e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0066e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4772e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2935e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2554e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4858e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0624e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7569e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9949e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5586e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7955e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3158e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2229e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3375e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4646e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7617e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4801e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1099e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4505e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0376e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0966e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8311e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8478e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1099e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4392e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9141e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5604e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5478e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6935e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9441e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6851e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5704e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4030e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3057e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0962e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4430e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1055e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4211e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7085e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6858e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8408e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3640e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3238e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6114e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5622e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9518e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9427e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6310e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3735e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5807e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7220e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3600e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4519e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6329e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6668e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2483e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3631e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5041e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7008e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2709e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5196e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2982e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 30---------------
Evaluating
				 {'precision': {'supports': 0.9152196118488254, 'contradicts': 0.6444444444444445, 'parts_of_same': 0.7168674698795181}, 'recall': {'supports': 0.9152196118488254, 'contradicts': 0.6641221374045801, 'parts_of_same': 0.7}, 'f1': {'supports': 0.9152196118488254, 'contradicts': 0.6541353383458647, 'parts_of_same': 0.7083333333333334}, 'support': {'supports': 979, 'contradicts': 131, 'parts_of_same': 170}, 'micro_avg': {'precision': 0.8609375, 'recall': 0.8609375, 'f1': 0.8609375, 'support': None}, 'macro_avg': {'precision': 0.7588438420575959, 'recall': 0.7597805830844685, 'f1': 0.7592294278426746, 'support': None}, 'weighted_avg': {'precision': 0.8611638219544846, 'recall': 0.8609375, 'f1': 0.8610221843671679, 'support': None}}
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7617e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0293e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2434e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4573e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3570e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0715e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7701e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0556e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8465e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0376e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5693e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1858e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4754e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6491e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3454e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2527e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0737e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8284e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0807e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9172e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4519e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7026e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9895e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5586e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2302e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1079e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3419e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8520e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4598e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5116e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5161e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1730e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4754e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5284e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2701e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3962e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5807e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7902e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5310e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7617e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3750e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0715e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2900e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2048e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0013e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7617e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1370e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0556e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2876e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3975e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6500e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6236e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3593e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7867e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0600e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3125e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2902e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7617e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0781e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1348e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0094e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3231e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7624e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3794e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5767e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3570e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4935e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0899e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8662e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0375e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8827e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7271e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7006e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1350e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4346e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7865e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1203e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0818e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9035e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3805e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9370e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5591e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6677e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3487e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2098e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5161e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1704e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7922e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3701e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3421e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8156e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4244e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5297e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5704e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6329e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9766e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6145e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3450e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5807e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0737e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3882e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8754e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5405e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5571e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7973e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1353e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7094e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8227e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4922e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3701e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8478e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3496e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5167e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2730e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3231e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4055e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5048e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0194e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0556e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7132e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5196e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5423e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5668e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2186e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4573e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6498e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2977e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3269e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9950e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0264e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8050e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6858e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5284e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2977e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6726e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7039e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8714e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1348e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5796e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5893e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1664e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0194e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3152e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0627e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2573e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4754e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6852e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6236e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5637e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4357e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2333e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5767e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9044e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8491e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5893e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6165e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1891e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9224e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3668e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5807e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8447e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5719e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9304e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7088e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0376e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3487e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6668e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3114e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0891e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1421e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8904e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5410e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0556e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1562e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0807e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6346e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2944e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4355e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2615e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8295e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5807e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3487e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5704e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1549e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7617e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5586e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0898e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8827e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2437e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2776e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1167e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5999e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9699e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6598e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5637e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8445e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6598e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8816e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6329e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4392e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1914e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5380e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7026e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5070e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4247e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3172e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0962e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9754e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0642e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7617e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0445e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3231e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4156e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3570e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3057e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5242e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3794e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7944e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5489e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8865e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7931e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1664e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1664e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2737e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9678e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2346e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8662e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0556e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3554e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7094e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4355e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0637e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3114e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4858e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0761e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1421e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6572e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2048e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3693e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1421e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2615e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8807e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1161e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5229e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4554e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2977e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3134e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3726e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2554e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0737e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5041e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7401e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4762e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7198e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8156e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2368e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1556e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7701e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0264e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8566e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6361e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0899e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3487e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0242e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2152e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1099e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3088e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7767e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0899e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1348e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2186e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3047e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0057e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3158e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9427e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7017e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0982e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2152e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7503e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6628e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5807e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5116e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5273e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2174e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8205e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9427e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0627e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8138e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7381e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1203e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1891e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2527e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1450e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1421e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5719e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0805e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9441e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5818e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3114e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6496e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5569e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7776e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2233e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1342e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2726e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2430e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9366e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9339e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3996e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9103e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1434e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2944e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8139e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0192e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5127e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4401e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9573e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9427e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6329e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3238e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1141e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1450e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7094e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2935e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1637e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6158e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4030e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9132e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1348e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1706e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4519e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5410e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4335e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7094e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6310e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1461e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2709e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7617e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7211e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6342e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0194e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4927e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3668e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6055e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9902e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2651e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5623e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1053e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3719e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9950e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9653e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3505e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8024e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0443e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9704e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8129e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9670e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4519e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0556e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6907e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9392e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7865e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8589e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8206e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0715e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4703e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7225e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3975e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9950e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1927e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3781e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7617e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4220e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2951e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8139e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1891e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7094e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8139e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0965e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1664e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4439e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2048e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3386e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3474e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8436e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3474e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2437e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8103e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8255e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5807e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7893e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3651e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3975e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5796e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9853e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3496e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5041e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5041e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4902e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6329e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5604e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9611e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9331e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3908e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8205e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0805e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9853e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6542e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0194e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5079e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6668e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2737e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4178e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4052e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9853e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5041e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6342e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9558e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9540e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8408e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0104e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0624e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0898e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5591e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8264e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9853e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6315e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4519e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2186e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5587e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3693e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6392e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3342e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3047e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7617e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5041e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4858e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2951e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6598e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0715e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9427e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6726e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6852e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7801e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5052e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4180e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3421e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5161e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1664e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4063e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5061e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5284e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0715e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5818e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1664e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5196e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8043e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7132e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8043e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8589e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8074e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4519e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0057e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6057e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1760e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9342e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7414e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6898e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8074e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3194e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7094e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8139e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6165e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6346e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3570e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7975e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5138e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8476e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2186e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1478e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3735e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7763e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9509e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4703e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8681e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2977e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6723e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8436e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3138e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7233e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4519e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1134e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3801e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2152e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4257e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2951e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9000e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3231e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9478e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3251e-06, device='cuda:0', grad_fn=<DivBackward0>)


		-------------RUN 2-----------
			------------EPOCH 1---------------
Evaluating
				 {'precision': {'supports': 0.7053504144687265, 'contradicts': 0.0, 'parts_of_same': 0.0}, 'recall': {'supports': 0.9821615949632738, 'contradicts': 0.0, 'parts_of_same': 0.0}, 'f1': {'supports': 0.8210526315789474, 'contradicts': 0.0, 'parts_of_same': 0.0}, 'support': {'supports': 953, 'contradicts': 125, 'parts_of_same': 272}, 'micro_avg': {'precision': 0.6933333333333334, 'recall': 0.6933333333333334, 'f1': 0.6933333333333334, 'support': None}, 'macro_avg': {'precision': 0.23511680482290884, 'recall': 0.32738719832109126, 'f1': 0.2736842105263158, 'support': None}, 'weighted_avg': {'precision': 0.49792514443607133, 'recall': 0.6933333333333334, 'f1': 0.5796023391812866, 'support': None}}
Loss: tensor(0.2645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3931, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3980, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9971, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8945, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3965, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3739, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3985, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3852, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8833, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3833, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5897, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3742, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2881, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2853, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1889, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1918, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1912, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9998, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3840, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9992, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2800, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2801, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3764, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2961, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3736, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3736, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3796, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3981, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1904, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6918, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3971, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4803, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3942, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3862, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4819, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6820, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4866, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3862, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4967, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4873, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3948, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2957, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3992, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9870, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2971, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2834, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6913, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4889, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8881, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1921, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2846, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4870, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8960, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2916, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2787, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4886, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0870, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2867, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0972, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3771, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7887, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5853, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4953, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2835, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1752, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4784, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1886, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4767, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8923, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4954, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1638, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8000, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3971, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0800, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1958, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3720, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6862, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2923, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3996, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8925, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0904, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7960, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0999, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1730, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3900, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0751, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2998, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9917, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4787, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2752, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5875, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2946, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1996, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6943, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2900, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5846, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3887, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2862, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3941, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3972, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3987, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1839, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4976, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0989, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4637, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0873, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3693, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4987, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0817, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6867, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2857, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2965, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1948, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7930, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1679, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1848, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3918, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1997, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2833, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1919, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2676, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1956, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2782, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2933, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1953, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0849, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0733, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0979, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1939, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0878, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6904, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1981, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9947, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0921, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1946, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2912, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6959, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0960, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3992, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3910, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1965, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0919, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0846, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5873, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1942, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4912, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3910, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2888, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4982, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1777, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2730, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0940, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4919, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1800, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8818, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1972, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4739, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4874, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1889, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7733, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2771, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3891, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8915, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2996, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2957, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8927, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5998, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3980, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3820, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1988, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2939, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1963, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3800, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1993, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5888, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0777, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0969, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1911, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3958, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1947, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5764, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0954, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5909, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0925, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0941, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1820, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5998, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0830, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7971, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0874, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0969, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1942, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0875, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0957, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5940, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3913, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6888, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0930, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2733, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2878, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1687, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5948, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3874, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2911, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7874, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1821, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2938, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1908, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1877, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7941, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3803, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2860, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2946, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3852, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1989, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8888, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0806, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0801, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3716, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1959, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2928, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1000, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6971, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1830, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4758, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0985, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1968, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1839, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1637, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0898, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0771, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0903, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0874, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2955, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0958, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2965, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4805, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0931, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1967, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1999, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3936, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0971, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5863, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1886, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2000, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3818, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2862, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0853, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1910, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1789, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4000, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2997, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0944, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2931, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4885, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2938, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1976, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6772, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1930, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0967, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6690, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5969, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2935, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2789, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0939, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0801, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0910, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0913, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8863, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1990, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3936, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4801, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5920, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2687, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9751, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9906, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0934, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8716, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(11.1852, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5883, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0879, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0690, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1896, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1885, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0987, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0986, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2982, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0875, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1959, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0796, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1000, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2957, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1840, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0919, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1962, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0801, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3866, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3979, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0866, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0777, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0720, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0818, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1994, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0992, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2885, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0948, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2040, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 2---------------
Evaluating
				 {'precision': {'supports': 0.9380281690140845, 'contradicts': 0.3951219512195122, 'parts_of_same': 0.542528735632184}, 'recall': {'supports': 0.6988457502623295, 'contradicts': 0.648, 'parts_of_same': 0.8676470588235294}, 'f1': {'supports': 0.8009621166566445, 'contradicts': 0.4909090909090909, 'parts_of_same': 0.6676096181046677}, 'support': {'supports': 953, 'contradicts': 125, 'parts_of_same': 272}, 'micro_avg': {'precision': 0.7281481481481481, 'recall': 0.7281481481481481, 'f1': 0.7281481481481481, 'support': None}, 'macro_avg': {'precision': 0.6252262852885936, 'recall': 0.7381642696952864, 'f1': 0.6531602752234678, 'support': None}, 'weighted_avg': {'precision': 0.8080732630109745, 'recall': 0.7281481481481481, 'f1': 0.7453854441939912, 'support': None}}
Loss: tensor(0.1480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4904, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3956, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1980, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3808, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1762, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0972, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1820, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3987, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0736, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0891, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2944, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2819, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0863, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3886, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0999, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2900, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0637, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0794, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0906, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0937, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6955, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6853, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0883, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4926, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4975, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1764, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3693, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8867, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0747, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4949, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3928, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1824, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0637, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2939, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3958, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3956, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0638, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3767, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3863, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0981, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6916, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2989, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1000, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0751, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0885, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3890, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6837, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3982, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1660, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3965, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2840, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1751, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0993, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0900, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6720, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1963, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1834, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1987, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2736, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0961, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0954, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0742, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0942, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1821, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0853, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1981, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0973, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6943, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1863, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1676, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0762, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0693, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4992, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0941, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0848, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0889, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0815, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0889, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0991, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8794, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6764, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1910, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0889, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3693, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2736, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0923, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0772, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0849, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2866, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0720, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1941, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3956, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2886, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0963, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0937, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2918, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2988, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1903, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0955, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1794, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0687, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3949, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8888, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0878, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0962, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0888, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0910, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0915, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1870, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7772, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3896, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0693, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2924, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0936, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0948, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1818, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3897, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2575, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9952, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5994, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7936, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3926, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2817, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0796, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4988, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0863, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0733, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1891, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1946, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0891, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0908, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0794, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0908, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3881, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0921, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1904, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0969, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0997, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1999, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0992, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0818, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0961, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0927, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3839, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0944, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1808, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1885, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0936, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0969, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8994, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0961, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5992, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1870, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1887, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0848, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3846, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5951, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8737, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1886, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9962, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1676, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0638, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1991, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1991, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5908, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2946, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3817, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0912, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8999, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1883, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0992, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2830, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0911, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3896, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0960, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0820, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2815, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6985, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3849, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0938, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0690, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0730, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3637, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0857, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1693, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3881, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1771, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0960, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2752, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0834, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1954, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4937, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4873, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9923, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6965, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0803, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3954, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1875, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0967, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0982, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5834, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8971, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1943, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1575, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2878, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2940, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3957, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0940, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1767, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2948, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3994, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1941, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9916, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0944, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0883, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1937, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3819, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4883, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0934, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2751, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1762, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1835, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0885, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0927, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0917, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2939, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0762, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0961, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0911, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1716, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2941, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5747, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0949, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1958, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1939, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0972, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0747, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0867, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6933, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0896, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2988, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0954, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0736, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0988, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0839, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0971, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0739, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0687, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8946, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 3---------------
Evaluating
				 {'precision': {'supports': 0.9351491569390402, 'contradicts': 0.4946808510638298, 'parts_of_same': 0.5882352941176471}, 'recall': {'supports': 0.7565582371458552, 'contradicts': 0.744, 'parts_of_same': 0.8455882352941176}, 'f1': {'supports': 0.8364269141531323, 'contradicts': 0.5942492012779552, 'parts_of_same': 0.693815987933635}, 'support': {'supports': 953, 'contradicts': 125, 'parts_of_same': 272}, 'micro_avg': {'precision': 0.7733333333333333, 'recall': 0.7733333333333333, 'f1': 0.7733333333333333, 'support': None}, 'macro_avg': {'precision': 0.6726884340401723, 'recall': 0.7820488241466577, 'f1': 0.7081640344549074, 'support': None}, 'weighted_avg': {'precision': 0.8244683355154696, 'recall': 0.7733333333333333, 'f1': 0.7852695911597246, 'support': None}}
Loss: tensor(0.4367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1996, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0800, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1801, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0752, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0720, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1857, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1930, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1928, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1967, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2997, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1994, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0742, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0782, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1903, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0900, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0909, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4980, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1935, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0996, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0943, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0801, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2777, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0957, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0930, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8808, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0716, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0975, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1000, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0973, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0997, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0924, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0660, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0819, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1959, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0961, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7963, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8690, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0926, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5898, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2733, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0973, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4860, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0917, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4942, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0996, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1996, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2913, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0693, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0815, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1942, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1925, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1918, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2956, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0917, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5679, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2808, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0637, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2679, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8805, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4972, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2973, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0933, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0953, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1897, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0736, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5920, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0898, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0990, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0947, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4896, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0676, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1840, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3764, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0944, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0777, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0955, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0782, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3925, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8982, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4849, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7960, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0960, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6787, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1988, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0925, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2787, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0926, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1967, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0912, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0985, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2947, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0870, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3733, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1897, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0789, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2911, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0919, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1860, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0772, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6992, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4789, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0793, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4990, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3952, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4739, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5969, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1947, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3875, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4900, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1741, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0955, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0875, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0896, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0870, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 4---------------
Evaluating
				 {'precision': {'supports': 0.9224242424242424, 'contradicts': 0.5289855072463768, 'parts_of_same': 0.6149870801033591}, 'recall': {'supports': 0.7985309548793285, 'contradicts': 0.584, 'parts_of_same': 0.875}, 'f1': {'supports': 0.8560179977502812, 'contradicts': 0.5551330798479088, 'parts_of_same': 0.7223065250379362}, 'support': {'supports': 953, 'contradicts': 125, 'parts_of_same': 272}, 'micro_avg': {'precision': 0.794074074074074, 'recall': 0.794074074074074, 'f1': 0.794074074074074, 'support': None}, 'macro_avg': {'precision': 0.6887989432579928, 'recall': 0.7525103182931095, 'f1': 0.711152534212042, 'support': None}, 'weighted_avg': {'precision': 0.8240518349808992, 'recall': 0.794074074074074, 'f1': 0.801217897516537, 'support': None}}
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0777, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0946, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3992, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4959, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1916, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0968, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7679, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0794, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2758, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1887, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0752, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0909, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2863, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0906, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7921, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0833, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0821, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1918, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1815, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3747, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0886, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0840, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1575, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0660, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2736, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6888, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0720, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0789, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0913, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1878, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2904, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0772, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0877, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0794, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1963, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0887, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0993, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4916, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0942, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0933, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0999, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0975, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0819, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3999, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2817, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6818, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1987, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0821, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0985, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8815, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1957, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2979, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1736, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0949, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0820, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0968, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1987, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0962, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0972, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0944, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2742, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5917, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0951, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0875, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0679, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0796, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5575, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0947, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0898, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1793, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6960, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5805, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3967, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0874, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2767, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3852, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1736, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3762, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0687, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8995, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0941, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0870, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1958, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1938, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 5---------------
Evaluating
				 {'precision': {'supports': 0.8921971252566735, 'contradicts': 0.7037037037037037, 'parts_of_same': 0.7457627118644068}, 'recall': {'supports': 0.9118572927597062, 'contradicts': 0.456, 'parts_of_same': 0.8088235294117647}, 'f1': {'supports': 0.9019200830306177, 'contradicts': 0.5533980582524272, 'parts_of_same': 0.7760141093474426}, 'support': {'supports': 953, 'contradicts': 125, 'parts_of_same': 272}, 'micro_avg': {'precision': 0.8488888888888889, 'recall': 0.8488888888888889, 'f1': 0.848888888888889, 'support': None}, 'macro_avg': {'precision': 0.7805545136082612, 'recall': 0.7255602740571568, 'f1': 0.7437774168768292, 'support': None}, 'weighted_avg': {'precision': 0.8452402081182899, 'recall': 0.8488888888888889, 'f1': 0.8442818030757308, 'support': None}}
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0771, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0926, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0890, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1837, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0777, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3982, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5961, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2803, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4916, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0867, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0994, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0935, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1752, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4881, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0943, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3824, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0751, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8906, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0840, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1879, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0885, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2958, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4930, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0948, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0833, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3987, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2888, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2824, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0887, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0969, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3806, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0938, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0819, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7808, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3000, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0975, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6968, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3881, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7917, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0866, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5794, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0874, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0963, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0739, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0878, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0923, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0958, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5942, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1687, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8720, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0961, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2835, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 6---------------
Evaluating
				 {'precision': {'supports': 0.8702807357212003, 'contradicts': 0.7349397590361446, 'parts_of_same': 0.8162393162393162}, 'recall': {'supports': 0.9433368310598111, 'contradicts': 0.488, 'parts_of_same': 0.7022058823529411}, 'f1': {'supports': 0.905337361530715, 'contradicts': 0.5865384615384616, 'parts_of_same': 0.7549407114624506}, 'support': {'supports': 953, 'contradicts': 125, 'parts_of_same': 272}, 'micro_avg': {'precision': 0.8525925925925926, 'recall': 0.8525925925925926, 'f1': 0.8525925925925926, 'support': None}, 'macro_avg': {'precision': 0.8071532703322205, 'recall': 0.7111809044709174, 'f1': 0.7489388448438757, 'support': None}, 'weighted_avg': {'precision': 0.8468608185473453, 'recall': 0.8525925925925926, 'f1': 0.8455168049991597, 'support': None}}
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3903, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7687, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0911, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1938, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8985, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0912, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8889, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0921, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2960, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2926, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0952, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0945, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2803, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1926, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0965, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2903, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0867, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4942, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6867, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0846, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1866, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1803, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0886, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8944, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6909, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6993, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2716, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8819, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3834, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0925, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1879, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1758, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7853, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4990, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3962, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2767, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2909, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0953, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8981, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0916, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3948, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3931, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0751, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0979, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0991, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0801, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3758, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0906, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0506, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 7---------------
Evaluating
				 {'precision': {'supports': 0.8977035490605428, 'contradicts': 0.569620253164557, 'parts_of_same': 0.8162393162393162}, 'recall': {'supports': 0.9024134312696747, 'contradicts': 0.72, 'parts_of_same': 0.7022058823529411}, 'f1': {'supports': 0.9000523286237572, 'contradicts': 0.6360424028268551, 'parts_of_same': 0.7549407114624506}, 'support': {'supports': 953, 'contradicts': 125, 'parts_of_same': 272}, 'micro_avg': {'precision': 0.8451851851851852, 'recall': 0.8451851851851852, 'f1': 0.8451851851851852, 'support': None}, 'macro_avg': {'precision': 0.7611877061548054, 'recall': 0.7748731045408719, 'f1': 0.763678480971021, 'support': None}, 'weighted_avg': {'precision': 0.8509119317906377, 'recall': 0.8451851851851852, 'f1': 0.8463696615182104, 'support': None}}
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0934, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0751, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6990, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3994, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0930, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0987, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0940, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0771, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0878, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0693, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3904, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1857, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0940, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0737, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0817, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0793, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0801, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0904, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1980, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1739, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0896, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3794, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3925, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0931, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0967, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0815, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1883, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1976, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1940, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4920, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0857, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0824, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5960, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 8---------------
Evaluating
				 {'precision': {'supports': 0.9254079254079254, 'contradicts': 0.5269461077844312, 'parts_of_same': 0.7076923076923077}, 'recall': {'supports': 0.8331584470094439, 'contradicts': 0.704, 'parts_of_same': 0.8455882352941176}, 'f1': {'supports': 0.8768636112644947, 'contradicts': 0.6027397260273973, 'parts_of_same': 0.7705192629815745}, 'support': {'supports': 953, 'contradicts': 125, 'parts_of_same': 272}, 'micro_avg': {'precision': 0.8237037037037037, 'recall': 0.8237037037037037, 'f1': 0.8237037037037037, 'support': None}, 'macro_avg': {'precision': 0.7200154469615548, 'recall': 0.7942488941011873, 'f1': 0.7500408667578222, 'support': None}, 'weighted_avg': {'precision': 0.8446476474660108, 'recall': 0.8237037037037037, 'f1': 0.8300553531996121, 'support': None}}
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6944, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1900, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0918, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6793, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2968, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4860, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2834, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 9---------------
Evaluating
				 {'precision': {'supports': 0.8928199791883454, 'contradicts': 0.7096774193548387, 'parts_of_same': 0.7331081081081081}, 'recall': {'supports': 0.9003147953830011, 'contradicts': 0.528, 'parts_of_same': 0.7977941176470589}, 'f1': {'supports': 0.8965517241379312, 'contradicts': 0.6055045871559633, 'parts_of_same': 0.7640845070422535}, 'support': {'supports': 953, 'contradicts': 125, 'parts_of_same': 272}, 'micro_avg': {'precision': 0.8451851851851852, 'recall': 0.8451851851851852, 'f1': 0.8451851851851852, 'support': None}, 'macro_avg': {'precision': 0.7785351688837642, 'recall': 0.7420363043433533, 'f1': 0.7553802727787161, 'support': None}, 'weighted_avg': {'precision': 0.8436833503638915, 'recall': 0.8451851851851852, 'f1': 0.842913224009953, 'support': None}}
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1879, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0817, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0772, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3758, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0637, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5000, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9995, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0784, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4806, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0833, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0853, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1954, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2980, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6969, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0796, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2817, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0981, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2752, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0931, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0971, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0839, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0985, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 10---------------
Evaluating
				 {'precision': {'supports': 0.9121844127332601, 'contradicts': 0.6630434782608695, 'parts_of_same': 0.6772334293948127}, 'recall': {'supports': 0.8719832109129066, 'contradicts': 0.488, 'parts_of_same': 0.8639705882352942}, 'f1': {'supports': 0.8916309012875536, 'contradicts': 0.5622119815668203, 'parts_of_same': 0.7592891760904685}, 'support': {'supports': 953, 'contradicts': 125, 'parts_of_same': 272}, 'micro_avg': {'precision': 0.8348148148148148, 'recall': 0.8348148148148148, 'f1': 0.8348148148148148, 'support': None}, 'macro_avg': {'precision': 0.7508204401296474, 'recall': 0.7413179330494003, 'f1': 0.7377106863149475, 'support': None}, 'weighted_avg': {'precision': 0.8417775354909589, 'recall': 0.8348148148148148, 'f1': 0.834464742607036, 'support': None}}
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0888, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1927, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7800, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0730, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3973, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3758, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1878, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0796, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2965, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0992, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0928, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0862, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1888, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0935, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2808, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1994, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3928, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0961, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6896, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1941, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0837, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 11---------------
Evaluating
				 {'precision': {'supports': 0.8769883351007424, 'contradicts': 0.4117647058823529, 'parts_of_same': 0.8655913978494624}, 'recall': {'supports': 0.8677859391395593, 'contradicts': 0.728, 'parts_of_same': 0.5919117647058824}, 'f1': {'supports': 0.8723628691983123, 'contradicts': 0.5260115606936415, 'parts_of_same': 0.7030567685589519}, 'support': {'supports': 953, 'contradicts': 125, 'parts_of_same': 272}, 'micro_avg': {'precision': 0.7992592592592592, 'recall': 0.7992592592592592, 'f1': 0.7992592592592592, 'support': None}, 'macro_avg': {'precision': 0.718114812944186, 'recall': 0.7292325679484805, 'f1': 0.7004770661503019, 'support': None}, 'weighted_avg': {'precision': 0.8316158013343373, 'recall': 0.7992592592592592, 'f1': 0.8061812596153568, 'support': None}}
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0796, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4772, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0999, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1575, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1837, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2782, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4926, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2937, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0733, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0752, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0904, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0820, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4949, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7981, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0917, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4000, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0801, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7660, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6849, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0999, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1000, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0916, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6741, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7987, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1903, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1849, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1875, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3577e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 12---------------
Evaluating
				 {'precision': {'supports': 0.9214975845410628, 'contradicts': 0.691358024691358, 'parts_of_same': 0.546485260770975}, 'recall': {'supports': 0.8006295907660022, 'contradicts': 0.448, 'parts_of_same': 0.8860294117647058}, 'f1': {'supports': 0.8568220101066818, 'contradicts': 0.5436893203883495, 'parts_of_same': 0.6760168302945302}, 'support': {'supports': 953, 'contradicts': 125, 'parts_of_same': 272}, 'micro_avg': {'precision': 0.7851851851851852, 'recall': 0.7851851851851852, 'f1': 0.7851851851851852, 'support': None}, 'macro_avg': {'precision': 0.719780290001132, 'recall': 0.7115530008435694, 'f1': 0.6921760535965205, 'support': None}, 'weighted_avg': {'precision': 0.8246303274694502, 'recall': 0.7851851851851852, 'f1': 0.7913993470520916, 'support': None}}
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2919, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0947, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0853, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0942, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4808, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0992, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0990, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2771, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5947, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0928, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0918, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2955, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6870, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0794, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0917, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1800, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6888, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3800, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2897, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1924, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0866, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6991, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3938, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0833, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0985, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7916, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5856e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 13---------------
Evaluating
				 {'precision': {'supports': 0.9027777777777778, 'contradicts': 0.4306930693069307, 'parts_of_same': 0.7253521126760564}, 'recall': {'supports': 0.8184679958027282, 'contradicts': 0.696, 'parts_of_same': 0.7573529411764706}, 'f1': {'supports': 0.8585580627407815, 'contradicts': 0.5321100917431193, 'parts_of_same': 0.7410071942446043}, 'support': {'supports': 953, 'contradicts': 125, 'parts_of_same': 272}, 'micro_avg': {'precision': 0.7948148148148149, 'recall': 0.7948148148148149, 'f1': 0.7948148148148149, 'support': None}, 'macro_avg': {'precision': 0.6862743199202549, 'recall': 0.7572736456597329, 'f1': 0.7105584495761684, 'support': None}, 'weighted_avg': {'precision': 0.8233182448396118, 'recall': 0.7948148148148149, 'f1': 0.8046470756254719, 'support': None}}
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0742, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4310e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4796, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0986, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1891, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3720, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0873, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2789, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0877, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0862, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0758, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2951, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0953, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0819, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2849, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4310e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4925, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5839, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6908, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7877, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0903, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2904, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 14---------------
Evaluating
				 {'precision': {'supports': 0.8968421052631579, 'contradicts': 0.6236559139784946, 'parts_of_same': 0.7035830618892508}, 'recall': {'supports': 0.8940188877229801, 'contradicts': 0.464, 'parts_of_same': 0.7941176470588235}, 'f1': {'supports': 0.8954282711508145, 'contradicts': 0.5321100917431193, 'parts_of_same': 0.7461139896373056}, 'support': {'supports': 953, 'contradicts': 125, 'parts_of_same': 272}, 'micro_avg': {'precision': 0.8340740740740741, 'recall': 0.8340740740740741, 'f1': 0.8340740740740741, 'support': None}, 'macro_avg': {'precision': 0.7413603603769677, 'recall': 0.7173788449272679, 'f1': 0.7245507841770799, 'support': None}, 'weighted_avg': {'precision': 0.8326089691829462, 'recall': 0.8340740740740741, 'f1': 0.8317036363377506, 'support': None}}
Loss: tensor(0.3401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4817, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0870, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3777, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0789, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7996, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2971, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0927, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0968, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2794, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6887, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7824, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1994, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0821, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6870, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1962, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0676, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0975, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5687, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0912, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0793, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 15---------------
Evaluating
				 {'precision': {'supports': 0.8800813008130082, 'contradicts': 0.591304347826087, 'parts_of_same': 0.796812749003984}, 'recall': {'supports': 0.9087093389296957, 'contradicts': 0.544, 'parts_of_same': 0.7352941176470589}, 'f1': {'supports': 0.8941662364481158, 'contradicts': 0.5666666666666667, 'parts_of_same': 0.7648183556405354}, 'support': {'supports': 953, 'contradicts': 125, 'parts_of_same': 272}, 'micro_avg': {'precision': 0.84, 'recall': 0.84, 'f1': 0.8399999999999999, 'support': None}, 'macro_avg': {'precision': 0.7560661325476931, 'recall': 0.7293344855255849, 'f1': 0.7418837529184392, 'support': None}, 'weighted_avg': {'precision': 0.8365656228756603, 'recall': 0.84, 'f1': 0.8377809995574914, 'support': None}}
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3944, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0808, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0849, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4919, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2690, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0916, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0837, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3742, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0803, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4803, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5870, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0898, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4965, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 16---------------
Evaluating
				 {'precision': {'supports': 0.8837675350701403, 'contradicts': 0.6935483870967742, 'parts_of_same': 0.7413793103448276}, 'recall': {'supports': 0.925498426023085, 'contradicts': 0.344, 'parts_of_same': 0.7904411764705882}, 'f1': {'supports': 0.9041517170681701, 'contradicts': 0.4598930481283422, 'parts_of_same': 0.7651245551601423}, 'support': {'supports': 953, 'contradicts': 125, 'parts_of_same': 272}, 'micro_avg': {'precision': 0.8444444444444444, 'recall': 0.8444444444444444, 'f1': 0.8444444444444444, 'support': None}, 'macro_avg': {'precision': 0.7728984108372474, 'recall': 0.6866465341645577, 'f1': 0.7097231067855515, 'support': None}, 'weighted_avg': {'precision': 0.8374660605353583, 'recall': 0.8444444444444444, 'f1': 0.835005256581902, 'support': None}}
Loss: tensor(6.0658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2953, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9951, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0800, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0890, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0911, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4736, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3866, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2877, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0896, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2926, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0818, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0784, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1821, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1986, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4953, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0716, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0693, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0914, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2319e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 17---------------
Evaluating
				 {'precision': {'supports': 0.895855472901169, 'contradicts': 0.6326530612244898, 'parts_of_same': 0.7138263665594855}, 'recall': {'supports': 0.8845750262329486, 'contradicts': 0.496, 'parts_of_same': 0.8161764705882353}, 'f1': {'supports': 0.8901795142555439, 'contradicts': 0.5560538116591928, 'parts_of_same': 0.7615780445969126}, 'support': {'supports': 953, 'contradicts': 125, 'parts_of_same': 272}, 'micro_avg': {'precision': 0.8348148148148148, 'recall': 0.8348148148148148, 'f1': 0.8348148148148148, 'support': None}, 'macro_avg': {'precision': 0.7474449668950481, 'recall': 0.7322504989403947, 'f1': 0.7359371235038831, 'support': None}, 'weighted_avg': {'precision': 0.8348093852089298, 'recall': 0.8348148148148148, 'f1': 0.8333311345728094, 'support': None}}
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1918, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0931, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1965, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3994, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0920, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0919, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0891, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2919, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0881, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0873, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2981, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0821, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2912, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0808, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6931, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 18---------------
Evaluating
				 {'precision': {'supports': 0.8884381338742393, 'contradicts': 0.7126436781609196, 'parts_of_same': 0.779783393501805}, 'recall': {'supports': 0.919202518363064, 'contradicts': 0.496, 'parts_of_same': 0.7941176470588235}, 'f1': {'supports': 0.9035585353274883, 'contradicts': 0.5849056603773585, 'parts_of_same': 0.7868852459016393}, 'support': {'supports': 953, 'contradicts': 125, 'parts_of_same': 272}, 'micro_avg': {'precision': 0.8548148148148148, 'recall': 0.8548148148148148, 'f1': 0.8548148148148149, 'support': None}, 'macro_avg': {'precision': 0.7936217351789879, 'recall': 0.736440055140629, 'f1': 0.7584498138688286, 'support': None}, 'weighted_avg': {'precision': 0.8502689513961157, 'recall': 0.8548148148148148, 'f1': 0.8505461322959349, 'support': None}}
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0787, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8244e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2968, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9853, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2942, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4793, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3405e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 19---------------
Evaluating
				 {'precision': {'supports': 0.8777335984095428, 'contradicts': 0.7532467532467533, 'parts_of_same': 0.7752808988764045}, 'recall': {'supports': 0.9265477439664218, 'contradicts': 0.464, 'parts_of_same': 0.7610294117647058}, 'f1': {'supports': 0.9014803471158755, 'contradicts': 0.5742574257425743, 'parts_of_same': 0.7680890538033395}, 'support': {'supports': 953, 'contradicts': 125, 'parts_of_same': 272}, 'micro_avg': {'precision': 0.8503703703703703, 'recall': 0.8503703703703703, 'f1': 0.8503703703703703, 'support': None}, 'macro_avg': {'precision': 0.8020870835109002, 'recall': 0.7171923852437092, 'f1': 0.7479422755539297, 'support': None}, 'weighted_avg': {'precision': 0.8455647169885336, 'recall': 0.8503703703703703, 'f1': 0.8443060530768588, 'support': None}}
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0874, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4310e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8425e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4491e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8425e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5877e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 20---------------
Evaluating
				 {'precision': {'supports': 0.8830645161290323, 'contradicts': 0.6941176470588235, 'parts_of_same': 0.7655677655677655}, 'recall': {'supports': 0.919202518363064, 'contradicts': 0.472, 'parts_of_same': 0.7683823529411765}, 'f1': {'supports': 0.900771208226221, 'contradicts': 0.5619047619047619, 'parts_of_same': 0.7669724770642201}, 'support': {'supports': 953, 'contradicts': 125, 'parts_of_same': 272}, 'micro_avg': {'precision': 0.8474074074074074, 'recall': 0.8474074074074074, 'f1': 0.8474074074074074, 'support': None}, 'macro_avg': {'precision': 0.7809166429185405, 'recall': 0.7198616237680802, 'f1': 0.7432161490650677, 'support': None}, 'weighted_avg': {'precision': 0.8418960162872244, 'recall': 0.8474074074074074, 'f1': 0.8424367188438161, 'support': None}}
Loss: tensor(4.8442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9015e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1320e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7154e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4172e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8425e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9576e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 21---------------
Evaluating
				 {'precision': {'supports': 0.8837209302325582, 'contradicts': 0.6781609195402298, 'parts_of_same': 0.7664233576642335}, 'recall': {'supports': 0.9171038824763903, 'contradicts': 0.472, 'parts_of_same': 0.7720588235294118}, 'f1': {'supports': 0.9001029866117405, 'contradicts': 0.5566037735849056, 'parts_of_same': 0.7692307692307693}, 'support': {'supports': 953, 'contradicts': 125, 'parts_of_same': 272}, 'micro_avg': {'precision': 0.8466666666666667, 'recall': 0.8466666666666667, 'f1': 0.8466666666666667, 'support': None}, 'macro_avg': {'precision': 0.7761017358123405, 'recall': 0.7203875686686007, 'f1': 0.7419791764758051, 'support': None}, 'weighted_avg': {'precision': 0.8410543072139468, 'recall': 0.8466666666666667, 'f1': 0.841929175681386, 'support': None}}
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7249e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3013e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5258e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5439e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8547e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8154e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2026e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5077e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4896e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7809e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3767e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 22---------------
Evaluating
				 {'precision': {'supports': 0.8836032388663968, 'contradicts': 0.6781609195402298, 'parts_of_same': 0.7636363636363637}, 'recall': {'supports': 0.9160545645330536, 'contradicts': 0.472, 'parts_of_same': 0.7720588235294118}, 'f1': {'supports': 0.8995363214837713, 'contradicts': 0.5566037735849056, 'parts_of_same': 0.7678244972577697}, 'support': {'supports': 953, 'contradicts': 125, 'parts_of_same': 272}, 'micro_avg': {'precision': 0.845925925925926, 'recall': 0.845925925925926, 'f1': 0.8459259259259259, 'support': None}, 'macro_avg': {'precision': 0.7751335073476634, 'recall': 0.7200377960208217, 'f1': 0.7413215307754822, 'support': None}, 'weighted_avg': {'precision': 0.8404096981417005, 'recall': 0.845925925925926, 'f1': 0.8412458143157486, 'support': None}}
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6887e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7792e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8653e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4353e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2587e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8342e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7447e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4715e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9035e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9147e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7430e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6706e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5077e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2750e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6158e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2401e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4353e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4353e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5982e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1088e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3854e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9015e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7430e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2317e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4172e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3130e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8878e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8794e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4715e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3600e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3492e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3637e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9191e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4353e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0145e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3556e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2225e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0260e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8472e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8895e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5982e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9916e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6851e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2225e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0174e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9746e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4353e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7068e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1412e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9558e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6525e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8061e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3372e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1344e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 23---------------
Evaluating
				 {'precision': {'supports': 0.8836032388663968, 'contradicts': 0.6781609195402298, 'parts_of_same': 0.7636363636363637}, 'recall': {'supports': 0.9160545645330536, 'contradicts': 0.472, 'parts_of_same': 0.7720588235294118}, 'f1': {'supports': 0.8995363214837713, 'contradicts': 0.5566037735849056, 'parts_of_same': 0.7678244972577697}, 'support': {'supports': 953, 'contradicts': 125, 'parts_of_same': 272}, 'micro_avg': {'precision': 0.845925925925926, 'recall': 0.845925925925926, 'f1': 0.8459259259259259, 'support': None}, 'macro_avg': {'precision': 0.7751335073476634, 'recall': 0.7200377960208217, 'f1': 0.7413215307754822, 'support': None}, 'weighted_avg': {'precision': 0.8404096981417005, 'recall': 0.845925925925926, 'f1': 0.8412458143157486, 'support': None}}
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0459e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9916e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6163e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4882e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7982e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4715e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5258e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4035e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2255e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7792e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5752e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6405e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4896e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7973e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8207e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8154e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3492e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5077e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3533e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7628e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7205e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8878e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3600e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2333e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2227e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1050e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3984e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4715e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4353e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9099e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5439e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9176e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5077e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4143e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6635e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9421e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9792e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8653e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6257e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9421e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8673e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7911e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6706e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4172e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8154e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7430e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7743e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1050e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6423e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1050e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4035e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2044e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2406e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0278e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5258e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5982e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5077e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9602e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2587e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9631e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6706e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7474e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6706e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4370e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8154e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7024e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3765e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7222e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2044e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5077e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3673e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8761e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9554e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6114e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3697e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0491e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4598e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8589e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9916e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9278e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0677e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9712e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3311e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2587e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5982e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0423e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8653e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9059e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7249e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7949e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7165e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1194e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8352e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4417e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7593e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3041e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8264e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6969e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9858e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6887e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9346e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9721e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 24---------------
Evaluating
				 {'precision': {'supports': 0.8836032388663968, 'contradicts': 0.6781609195402298, 'parts_of_same': 0.7636363636363637}, 'recall': {'supports': 0.9160545645330536, 'contradicts': 0.472, 'parts_of_same': 0.7720588235294118}, 'f1': {'supports': 0.8995363214837713, 'contradicts': 0.5566037735849056, 'parts_of_same': 0.7678244972577697}, 'support': {'supports': 953, 'contradicts': 125, 'parts_of_same': 272}, 'micro_avg': {'precision': 0.845925925925926, 'recall': 0.845925925925926, 'f1': 0.8459259259259259, 'support': None}, 'macro_avg': {'precision': 0.7751335073476634, 'recall': 0.7200377960208217, 'f1': 0.7413215307754822, 'support': None}, 'weighted_avg': {'precision': 0.8404096981417005, 'recall': 0.845925925925926, 'f1': 0.8412458143157486, 'support': None}}
Loss: tensor(3.7267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6807e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9421e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7441e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3123e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3492e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4896e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0688e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9203e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4715e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7796e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3673e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7024e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1845e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2763e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9558e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3057e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4960e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9015e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8260e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0068e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1315e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2044e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2949e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3412e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7801e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9518e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7690e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9059e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8809e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5439e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4803e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3406e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0476e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7430e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1571e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4211e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6984e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3492e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4909e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2781e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1295e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7434e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6516e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7278e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3010e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0459e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8642e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3485e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8878e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8714e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9761e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2949e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5512e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5350e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5154e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5218e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7249e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6163e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2598e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5121e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8432e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5801e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7017e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4172e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8895e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4628e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4670e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4353e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9121e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4357e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8767e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3319e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8653e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3509e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7266e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3871e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4445e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3646e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4127e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8633e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1774e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4461e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3068e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7028e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5761e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3037e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1401e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8516e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4176e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4715e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2227e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5077e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5746e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2869e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2136e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4558e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1026e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0953e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1035e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0604e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9587e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7068e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8520e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8024e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0161e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2706e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7902e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7019e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8920e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2860e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1746e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7430e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2225e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9990e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6750e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1013e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0644e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9269e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3194e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0278e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3130e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1079e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5405e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1509e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9103e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2587e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6525e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0430e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5765e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 25---------------
Evaluating
				 {'precision': {'supports': 0.8836032388663968, 'contradicts': 0.6781609195402298, 'parts_of_same': 0.7636363636363637}, 'recall': {'supports': 0.9160545645330536, 'contradicts': 0.472, 'parts_of_same': 0.7720588235294118}, 'f1': {'supports': 0.8995363214837713, 'contradicts': 0.5566037735849056, 'parts_of_same': 0.7678244972577697}, 'support': {'supports': 953, 'contradicts': 125, 'parts_of_same': 272}, 'micro_avg': {'precision': 0.845925925925926, 'recall': 0.845925925925926, 'f1': 0.8459259259259259, 'support': None}, 'macro_avg': {'precision': 0.7751335073476634, 'recall': 0.7200377960208217, 'f1': 0.7413215307754822, 'support': None}, 'weighted_avg': {'precision': 0.8404096981417005, 'recall': 0.845925925925926, 'f1': 0.8412458143157486, 'support': None}}
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4628e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5624e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4130e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1955e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1039e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1320e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9920e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8257e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4483e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9631e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9015e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7134e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6854e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0236e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8392e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2112e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1231e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8878e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4185e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2044e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4534e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4759e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3922e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2949e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4900e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8878e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1257e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2768e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8730e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9218e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3655e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9642e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0858e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9253e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6478e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2728e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6807e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6099e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1675e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2286e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4224e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2105e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7099e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9297e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8399e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7693e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9920e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2388e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3346e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3405e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8708e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7646e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3013e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5518e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9624e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3907e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0507e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3010e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7185e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1050e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7138e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5465e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3673e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2969e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2635e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0430e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1357e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3284e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9070e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6414e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0278e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5229e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1503e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7112e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7103e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8008e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6551e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8154e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6823e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2816e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8573e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7969e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4538e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8558e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1688e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7536e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4940e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3116e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0960e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2233e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5571e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4189e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6516e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5041e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9783e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4984e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0801e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2651e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0913e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9728e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4712e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9304e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3352e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3644e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7331e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9185e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0536e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8231e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4461e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2461e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0578e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4604e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6399e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3951e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8922e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9927e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4491e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0549e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4759e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1425e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2735e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7450e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6227e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3103e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2706e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6218e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7068e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2895e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2099e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4432e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8154e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4726e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8224e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9048e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6030e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5147e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1593e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3900e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8008e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1050e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0315e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8156e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4545e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5525e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3856e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7792e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2714e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8043e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5163e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5169e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1750e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6885e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8068e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7951e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4432e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2655e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5432e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 26---------------
Evaluating
				 {'precision': {'supports': 0.8834853090172239, 'contradicts': 0.6781609195402298, 'parts_of_same': 0.7608695652173914}, 'recall': {'supports': 0.9150052465897167, 'contradicts': 0.472, 'parts_of_same': 0.7720588235294118}, 'f1': {'supports': 0.8989690721649484, 'contradicts': 0.5566037735849056, 'parts_of_same': 0.7664233576642335}, 'support': {'supports': 953, 'contradicts': 125, 'parts_of_same': 272}, 'micro_avg': {'precision': 0.8451851851851852, 'recall': 0.8451851851851852, 'f1': 0.8451851851851852, 'support': None}, 'macro_avg': {'precision': 0.7741719312582817, 'recall': 0.7196880233730428, 'f1': 0.7406654011380293, 'support': None}, 'weighted_avg': {'precision': 0.8397689897593138, 'recall': 0.8451851851851852, 'f1': 0.8405630746340597, 'support': None}}
Loss: tensor(2.7641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3821e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0189e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3895e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4801e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6885e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9975e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9655e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9946e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9587e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7474e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8108e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2026e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4920e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5436e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3673e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3297e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1310e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6887e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4759e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7474e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5297e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6388e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5041e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5878e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1026e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6726e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4916e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0779e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4997e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9821e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6525e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5121e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3278e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6944e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3037e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9920e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8324e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5664e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4308e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2922e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8741e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1209e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5310e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6039e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5847e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5571e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9600e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5209e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3141e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6803e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1507e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7534e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7024e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6421e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2633e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4895e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1220e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6750e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7322e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1324e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0823e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9397e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4988e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1688e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9450e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9282e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9441e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8379e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3774e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4545e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9927e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9055e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5765e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1821e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7821e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0412e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7443e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9390e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4491e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8854e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1050e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4384e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6136e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0198e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6997e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4410e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8224e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9169e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3955e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7145e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3125e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7397e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8271e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1322e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5308e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0134e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5218e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6015e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4491e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4467e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3586e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3924e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4432e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6310e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5746e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0913e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6163e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1013e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8697e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4759e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3445e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6059e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9227e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3041e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6907e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3862e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2949e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9591e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9200e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3229e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5041e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2220e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6308e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7132e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3310e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5664e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0516e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4397e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0821e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7394e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4940e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4633e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7269e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6542e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4352e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0459e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6845e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5891e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9565e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7640e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8512e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6006e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6525e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3851e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6476e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4913e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7172e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8220e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9163e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0145e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3260e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3465e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9615e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7549e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3085e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2178e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0419e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0417e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9534e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6604e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2913e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3997e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3057e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1461e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2048e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9297e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9902e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7487e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6783e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8028e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2225e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5646e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5752e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5041e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6370e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4156e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7633e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6282e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 27---------------
Evaluating
				 {'precision': {'supports': 0.8834853090172239, 'contradicts': 0.6781609195402298, 'parts_of_same': 0.7608695652173914}, 'recall': {'supports': 0.9150052465897167, 'contradicts': 0.472, 'parts_of_same': 0.7720588235294118}, 'f1': {'supports': 0.8989690721649484, 'contradicts': 0.5566037735849056, 'parts_of_same': 0.7664233576642335}, 'support': {'supports': 953, 'contradicts': 125, 'parts_of_same': 272}, 'micro_avg': {'precision': 0.8451851851851852, 'recall': 0.8451851851851852, 'f1': 0.8451851851851852, 'support': None}, 'macro_avg': {'precision': 0.7741719312582817, 'recall': 0.7196880233730428, 'f1': 0.7406654011380293, 'support': None}, 'weighted_avg': {'precision': 0.8397689897593138, 'recall': 0.8451851851851852, 'f1': 0.8405630746340597, 'support': None}}
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9055e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6289e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8693e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3138e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8587e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5282e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6163e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7273e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4399e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7887e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6770e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3357e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3640e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4317e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4794e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6286e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0094e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2922e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0529e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6399e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6825e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3070e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6763e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6953e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1924e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1320e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8055e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5403e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9783e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5257e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5242e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2052e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7628e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3063e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5697e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5441e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6944e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9384e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7699e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6770e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4865e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0143e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4357e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5017e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1955e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4750e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0459e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1896e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0975e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4591e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5765e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4205e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3516e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4050e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6414e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8467e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4171e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0951e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2598e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5319e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0099e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6070e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4973e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9940e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9044e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7856e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4953e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1549e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2399e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8514e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0589e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9927e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6770e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2860e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7545e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9167e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7715e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5684e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6761e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1999e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9940e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2037e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6491e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5459e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9410e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4655e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6059e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5953e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1763e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2587e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1690e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9715e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0573e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3887e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0900e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9554e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8308e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9059e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2655e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2520e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2439e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5357e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2540e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7145e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9969e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2533e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1849e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2317e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1070e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3686e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5403e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2059e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2693e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0951e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5631e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4176e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8311e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9551e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7962e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1465e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0845e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2551e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3123e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8512e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1969e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0889e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6238e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9706e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8331e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5088e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3774e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8966e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2854e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4405e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1432e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2595e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3714e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0284e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0600e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1026e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8666e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1194e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9973e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2271e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1320e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9668e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4496e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3818e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1262e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4249e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1010e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6046e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7969e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9381e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4951e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7781e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9735e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8032e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5132e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5041e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4907e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9871e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9558e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3070e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6092e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9670e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4851e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8308e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3130e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5940e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9397e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9712e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5470e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9940e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6430e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4593e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4461e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5865e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0602e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7472e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0470e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7472e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6730e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1357e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9203e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9712e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7443e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7070e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3070e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5527e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2439e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9746e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2527e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7019e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9551e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1019e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8955e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8127e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5470e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4655e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9055e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9384e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9927e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7516e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8648e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6017e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0818e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1509e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3004e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2436e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7653e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3251e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0651e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2450e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8061e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3388e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3257e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3432e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9988e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1558e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2158e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6026e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6430e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8512e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7085e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5436e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5503e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4284e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4604e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3041e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9207e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1887e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7348e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2269e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2540e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 28---------------
Evaluating
				 {'precision': {'supports': 0.8834853090172239, 'contradicts': 0.6781609195402298, 'parts_of_same': 0.7608695652173914}, 'recall': {'supports': 0.9150052465897167, 'contradicts': 0.472, 'parts_of_same': 0.7720588235294118}, 'f1': {'supports': 0.8989690721649484, 'contradicts': 0.5566037735849056, 'parts_of_same': 0.7664233576642335}, 'support': {'supports': 953, 'contradicts': 125, 'parts_of_same': 272}, 'micro_avg': {'precision': 0.8451851851851852, 'recall': 0.8451851851851852, 'f1': 0.8451851851851852, 'support': None}, 'macro_avg': {'precision': 0.7741719312582817, 'recall': 0.7196880233730428, 'f1': 0.7406654011380293, 'support': None}, 'weighted_avg': {'precision': 0.8397689897593138, 'recall': 0.8451851851851852, 'f1': 0.8405630746340597, 'support': None}}
Loss: tensor(2.8305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1688e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9366e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0604e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8317e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0123e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0165e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0999e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9847e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9408e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5491e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4450e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4942e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4554e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8213e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3445e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2178e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5209e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2461e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5154e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3278e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0405e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1492e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8944e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5684e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8032e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9690e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0222e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4172e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3189e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6726e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4973e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4578e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4966e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0452e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7085e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0655e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2361e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3222e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1622e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8017e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4856e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9443e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9059e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8015e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1147e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9372e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3924e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3640e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8827e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9236e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9282e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8114e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9565e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6538e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4973e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6185e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3887e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3125e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2483e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2178e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3774e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6708e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7447e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1026e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2121e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3072e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5765e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7615e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2869e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4946e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1712e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0774e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4774e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4556e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2346e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6176e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6770e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9849e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4222e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6942e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7924e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9194e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6904e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9768e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6203e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6882e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0284e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6136e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3068e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9927e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3796e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0637e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9257e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2092e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4006e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0346e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5342e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0459e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3684e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5503e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4896e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3231e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3752e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7969e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1328e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9189e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8068e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3353e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2099e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8907e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9509e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5889e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1891e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0061e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4770e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4973e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7587e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9238e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9759e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6525e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0944e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5242e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1922e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9216e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2527e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7969e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4041e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4856e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3203e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7163e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7269e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8673e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9079e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9551e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4688e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6589e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9178e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3637e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5845e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7809e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5121e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7774e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6966e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2595e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9551e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1977e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8132e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0178e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0854e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9604e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3503e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0655e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1236e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4220e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6295e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0684e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1699e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7962e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9940e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9441e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0688e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9591e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4540e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1854e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7975e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2333e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5342e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5845e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7699e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6445e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8646e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5503e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2225e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7489e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9540e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6997e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9370e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2889e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0037e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2461e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5704e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8957e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6589e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2911e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2156e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0264e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1931e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7969e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5439e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1858e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0357e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3726e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8772e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7266e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9138e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4112e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5664e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4114e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8421e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9558e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2213e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2549e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9015e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8030e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6176e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7357e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0913e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4721e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0721e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6770e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7768e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0809e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1869e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2949e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2721e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1851e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1370e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2514e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5039e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2121e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1622e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6891e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6525e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5108e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2876e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4077e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9712e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2165e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9531e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6108e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3154e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5392e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8231e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5571e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8379e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5898e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8783e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7443e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9827e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9000e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9225e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2708e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2165e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2693e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5191e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1849e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9699e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7447e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8512e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7127e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5697e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7304e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1320e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1591e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3569e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6723e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1984e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9236e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8121e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6785e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4887e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5507e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8953e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5242e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3593e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2233e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7823e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9697e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3209e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7759e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 29---------------
Evaluating
				 {'precision': {'supports': 0.8834853090172239, 'contradicts': 0.6781609195402298, 'parts_of_same': 0.7608695652173914}, 'recall': {'supports': 0.9150052465897167, 'contradicts': 0.472, 'parts_of_same': 0.7720588235294118}, 'f1': {'supports': 0.8989690721649484, 'contradicts': 0.5566037735849056, 'parts_of_same': 0.7664233576642335}, 'support': {'supports': 953, 'contradicts': 125, 'parts_of_same': 272}, 'micro_avg': {'precision': 0.8451851851851852, 'recall': 0.8451851851851852, 'f1': 0.8451851851851852, 'support': None}, 'macro_avg': {'precision': 0.7741719312582817, 'recall': 0.7196880233730428, 'f1': 0.7406654011380293, 'support': None}, 'weighted_avg': {'precision': 0.8397689897593138, 'recall': 0.8451851851851852, 'f1': 0.8405630746340597, 'support': None}}
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5342e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3057e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1876e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2339e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2178e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0988e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7677e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7587e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3860e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0922e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8719e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3297e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7851e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5805e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2973e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6357e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2249e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2527e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7112e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6542e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8635e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7628e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9651e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8885e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2043e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0988e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7977e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2249e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1282e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7977e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9207e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7225e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8801e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5516e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1862e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5761e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0918e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0405e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4715e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0015e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4068e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8452e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2860e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0900e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4465e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2165e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8997e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4375e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0640e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7516e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6719e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7266e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6024e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8767e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9768e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6249e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7538e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7397e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4565e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7019e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9198e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0785e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9379e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1094e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3297e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1624e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0628e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4816e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6022e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6046e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5342e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4264e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7216e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8684e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1017e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8198e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8988e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1746e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5684e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2869e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1099e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2439e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9008e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1719e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8988e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0944e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9189e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3664e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1593e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8088e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2507e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2233e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5851e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5706e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7032e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5507e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8646e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3527e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0673e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6770e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3708e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8664e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8352e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2514e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3615e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5231e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9229e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0308e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5375e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2911e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9626e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5127e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1531e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1865e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3997e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8121e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5461e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7496e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9721e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4951e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8302e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9008e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1013e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7562e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4035e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6904e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0266e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6227e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5134e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5966e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4880e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5006e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4375e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2361e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5765e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0231e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2529e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3174e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6554e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2258e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9472e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4565e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2730e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9706e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9297e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7628e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6723e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2688e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1147e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0637e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6384e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7430e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8171e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2675e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9213e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9194e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0695e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1677e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2582e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9496e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8130e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6657e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9880e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2108e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3145e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7224e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1478e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9079e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1997e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6055e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1282e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8589e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5050e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1695e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7035e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0818e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8863e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0651e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2891e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0666e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7580e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9207e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9189e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8171e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4059e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1273e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0284e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4646e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6222e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0266e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4143e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8032e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8646e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2333e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8171e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2514e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0423e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1551e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0167e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6904e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7759e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9032e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2041e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9189e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3116e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0637e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7178e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8099e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3432e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8492e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6352e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3229e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9211e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6657e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8827e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8902e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3459e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8284e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3545e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1057e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8666e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3962e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9496e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8646e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6209e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3454e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1514e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9372e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4935e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2944e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2876e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8845e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9534e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1147e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1425e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5704e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3774e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3454e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6681e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6633e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2765e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5865e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5571e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3353e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1653e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0295e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1207e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0302e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8863e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9805e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7668e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0818e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4185e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1984e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4061e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2238e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7041e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3238e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9008e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1008e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1644e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5503e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1999e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7238e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0818e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5472e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3388e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3677e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4503e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9950e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3600e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4858e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3026e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7236e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0039e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7878e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4598e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0447e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4165e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4527e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1099e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5699e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7759e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5984e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1651e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8646e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7754e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3741e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9178e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6066e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0423e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8379e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4052e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2514e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1454e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4765e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5478e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9721e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8375e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2520e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3908e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7949e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3849e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9384e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6858e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2876e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3251e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9472e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4774e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2225e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8792e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0920e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0920e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4781e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0483e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7397e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9675e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1677e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2845e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6542e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2999e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3942e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9099e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4708e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0556e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1984e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1273e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6092e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5503e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0288e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6496e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8624e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2368e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3545e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8194e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3207e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5238e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7651e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5134e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9721e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 30---------------
Evaluating
				 {'precision': {'supports': 0.8834853090172239, 'contradicts': 0.6781609195402298, 'parts_of_same': 0.7608695652173914}, 'recall': {'supports': 0.9150052465897167, 'contradicts': 0.472, 'parts_of_same': 0.7720588235294118}, 'f1': {'supports': 0.8989690721649484, 'contradicts': 0.5566037735849056, 'parts_of_same': 0.7664233576642335}, 'support': {'supports': 953, 'contradicts': 125, 'parts_of_same': 272}, 'micro_avg': {'precision': 0.8451851851851852, 'recall': 0.8451851851851852, 'f1': 0.8451851851851852, 'support': None}, 'macro_avg': {'precision': 0.7741719312582817, 'recall': 0.7196880233730428, 'f1': 0.7406654011380293, 'support': None}, 'weighted_avg': {'precision': 0.8397689897593138, 'recall': 0.8451851851851852, 'f1': 0.8405630746340597, 'support': None}}
Loss: tensor(1.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0445e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0348e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2891e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4604e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4527e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3922e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5512e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3571e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2136e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2916e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1878e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5999e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6723e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3781e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1461e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7132e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0015e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0920e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6770e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1690e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6178e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2714e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2801e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4459e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2860e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0264e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5079e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5266e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5129e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3454e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6955e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9578e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2317e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8302e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5380e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0006e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1712e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2167e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3545e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1108e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3432e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6147e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2346e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6203e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4519e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9880e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3715e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3353e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4827e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2317e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6852e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5794e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7719e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3048e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6227e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1565e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5628e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3816e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2514e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3478e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2514e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1677e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7092e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5317e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2434e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3339e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7491e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4165e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8350e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0249e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9690e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6783e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5342e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5308e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0538e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1101e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9653e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2916e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8169e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2869e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9551e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8827e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8693e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4686e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0108e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2776e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2158e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0257e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5121e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1465e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7039e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6668e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2249e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8635e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0785e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8666e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9895e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3600e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2655e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9551e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5807e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6805e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5284e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0827e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8512e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2876e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9225e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4889e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5070e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5951e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8375e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7582e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5322e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7381e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3794e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8103e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8103e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8139e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2675e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6134e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4158e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1333e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1706e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0061e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2935e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4092e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9931e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5322e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5161e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0805e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5489e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4417e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5198e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7697e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6319e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5776e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3891e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0423e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2695e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5127e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8324e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4156e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3570e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3125e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8662e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4765e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7628e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1397e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1072e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2735e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2414e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0781e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8024e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3492e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3238e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1039e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7809e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9496e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0918e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1203e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3916e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9558e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2916e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3004e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7026e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0856e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6951e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8024e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8171e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5794e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5297e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1260e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3996e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7216e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5807e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8765e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1715e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9666e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3459e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6556e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3534e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9646e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7768e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5999e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0737e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8467e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0556e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2946e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8973e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6677e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2730e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1461e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3421e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6681e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0715e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6039e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0904e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0860e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4134e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7701e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8139e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9940e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3781e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6319e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1505e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4779e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2390e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6668e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4439e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1969e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9542e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7253e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3050e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3443e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0015e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3646e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1622e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0262e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1677e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7419e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4708e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9035e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0918e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2889e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9895e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7308e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6293e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8139e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8194e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7809e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8626e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0737e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6397e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5218e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3996e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0637e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2474e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5887e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4335e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4236e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5805e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6165e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9896e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1370e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1099e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3677e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4375e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8465e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0331e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4410e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8445e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0737e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1384e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4410e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8487e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1099e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5414e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9940e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2514e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5885e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3315e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5231e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0655e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7922e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2514e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4030e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8382e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5489e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0673e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2911e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0556e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6792e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5832e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3955e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9540e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1880e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5180e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3125e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6134e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0331e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3185e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5116e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2039e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5586e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4519e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5167e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7503e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2512e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1167e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0600e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6876e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4421e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8198e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8675e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5414e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9518e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5489e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1410e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7211e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9061e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1348e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5491e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9816e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5999e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5041e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5684e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4628e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5284e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2514e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9450e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3794e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7805e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5061e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3158e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0304e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8801e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5196e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7361e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8487e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2514e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9896e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7617e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3207e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2145e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0818e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7271e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2152e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7516e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1348e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2655e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3231e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4633e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2002e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3545e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5772e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7401e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5048e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6863e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5317e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0066e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1372e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2066e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2098e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2357e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2708e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6572e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0273e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1677e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8156e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7063e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1412e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5010e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5984e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7975e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3297e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0863e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9950e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5637e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5807e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3176e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5516e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4723e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8171e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)


		-------------RUN 3-----------
			------------EPOCH 1---------------
Evaluating
				 {'precision': {'supports': 0.7008797653958945, 'contradicts': 0.08974358974358974, 'parts_of_same': 0.07692307692307693}, 'recall': {'supports': 0.8929016189290162, 'contradicts': 0.08974358974358974, 'parts_of_same': 0.011583011583011582}, 'f1': {'supports': 0.7853231106243156, 'contradicts': 0.08974358974358974, 'parts_of_same': 0.020134228187919462}, 'support': {'supports': 803, 'contradicts': 78, 'parts_of_same': 259}, 'micro_avg': {'precision': 0.637719298245614, 'recall': 0.637719298245614, 'f1': 0.637719298245614, 'support': None}, 'macro_avg': {'precision': 0.28918214402085374, 'recall': 0.3314094067518725, 'f1': 0.29840030951860824, 'support': None}, 'weighted_avg': {'precision': 0.51730660397893, 'recall': 0.637719298245614, 'f1': 0.5638852832736813, 'support': None}}
Loss: tensor(0.2627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5923, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4819, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3815, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1915, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3862, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3995, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3716, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9874, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2928, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2904, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2920, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2849, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2830, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2912, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9975, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8853, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8913, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9906, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0990, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9846, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2741, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8771, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8916, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2987, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2999, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2990, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3660, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3918, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0787, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3906, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2996, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6908, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2900, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3994, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6990, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2979, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9951, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4971, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0963, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0821, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0981, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2948, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6879, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5967, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6900, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5916, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4908, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3762, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2803, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4796, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2914, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6821, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8878, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4739, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2877, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3954, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4986, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4877, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8947, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3968, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4949, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9956, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2821, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7995, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2690, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2849, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6906, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6878, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1739, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1930, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0981, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9992, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2660, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2885, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3747, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3886, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3952, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8896, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7660, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0793, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1690, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2924, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3911, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6840, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1875, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0971, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1973, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0888, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1939, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2898, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5982, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4885, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2796, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2949, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5952, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2915, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0965, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0819, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2919, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0879, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0815, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3803, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3985, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3924, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1965, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1908, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1896, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4943, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0949, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3800, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2730, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2885, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0956, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2963, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2953, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7758, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1965, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2954, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6921, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4972, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2973, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1737, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2904, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1852, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1637, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1637, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1898, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4975, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0968, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0963, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0925, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0784, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4805, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3963, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2794, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3957, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6771, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1910, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4896, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2846, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1873, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0919, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6794, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0782, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4819, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8835, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0936, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1961, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2747, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5818, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1772, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0891, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1758, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0733, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1927, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2818, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0997, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1660, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1921, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2742, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3993, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0840, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2821, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1928, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0940, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0943, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1991, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1944, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0906, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0837, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0954, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5764, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0875, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2924, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2794, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1933, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0991, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0939, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3954, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2962, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0758, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3993, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0979, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2940, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1852, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6940, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1883, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5989, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0886, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4849, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1889, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4961, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3945, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4898, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0787, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5887, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0898, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0889, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3687, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5793, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3820, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2991, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5999, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0957, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3830, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1824, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6820, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1914, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3839, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4953, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2999, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1915, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7739, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0885, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0930, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1846, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2824, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4789, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3952, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1796, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2889, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2806, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3997, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1917, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7747, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3803, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2820, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6942, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0758, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2955, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1912, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2887, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0787, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0939, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1693, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5940, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1891, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4979, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1863, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4996, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5747, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1800, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0833, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2934, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2921, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5883, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0945, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0762, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2903, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2903, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0953, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1890, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2879, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0975, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1992, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2830, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0808, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4787, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1837, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2676, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1793, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1911, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3782, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0954, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0638, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0957, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4963, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5693, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0940, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0968, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0960, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0787, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0824, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6875, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0676, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1817, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4862, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0996, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4676, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0973, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2963, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0805, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0690, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7969, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1903, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3764, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0933, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2991, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3937, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0840, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1994, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0991, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0736, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1839, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0996, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1777, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0874, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0914, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0803, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0833, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2961, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0937, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6878, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0870, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1967, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0908, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2751, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4000, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2771, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4935, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2959, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0817, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5758, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0942, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8995, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2958, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0888, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1976, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6948, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4990, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0909, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0965, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4942, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1853, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4793, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1985, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1874, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0903, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0998, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2958, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3923, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5737, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3801, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2951, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1896, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0817, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2888, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0819, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1896, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0946, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3981, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1975, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6105, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 2---------------
Evaluating
				 {'precision': {'supports': 0.8912386706948641, 'contradicts': 0.27307692307692305, 'parts_of_same': 0.7477064220183486}, 'recall': {'supports': 0.7347447073474471, 'contradicts': 0.9102564102564102, 'parts_of_same': 0.6293436293436293}, 'f1': {'supports': 0.8054607508532424, 'contradicts': 0.42011834319526625, 'parts_of_same': 0.6834381551362684}, 'support': {'supports': 803, 'contradicts': 78, 'parts_of_same': 259}, 'micro_avg': {'precision': 0.7228070175438597, 'recall': 0.7228070175438597, 'f1': 0.7228070175438598, 'support': None}, 'macro_avg': {'precision': 0.6373406719300453, 'recall': 0.7581149156491622, 'f1': 0.6363390830615924, 'support': None}, 'weighted_avg': {'precision': 0.8163338735708141, 'recall': 0.7228070175438597, 'f1': 0.7513725402497174, 'support': None}}
Loss: tensor(0.5028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0971, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2937, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0879, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0834, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3928, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0954, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0862, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0954, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6741, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0803, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0904, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0969, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0889, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0962, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2840, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2910, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1817, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2947, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0860, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0924, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4953, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2920, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2898, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1789, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0638, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5915, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0925, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0870, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0904, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3873, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0951, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2965, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5821, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0986, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0737, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1936, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2808, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1771, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1733, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0866, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1963, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6835, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3801, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0736, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1805, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0787, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0992, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0952, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0951, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2830, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1660, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3784, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1000, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1870, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0951, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0920, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2784, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2994, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1917, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3886, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1976, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0934, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2898, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0976, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4898, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0900, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8995, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0962, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0955, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0820, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0889, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1890, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0971, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0923, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0777, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0873, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4758, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0801, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0741, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8849, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0853, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1976, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4762, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2904, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0891, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0789, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1900, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3991, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7808, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2824, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1873, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1762, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5815, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3936, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0921, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5913, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0958, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2991, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2801, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0961, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1910, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5976, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0992, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8968, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4933, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5968, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1793, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0808, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0758, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6960, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2923, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0963, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0787, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2940, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0938, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1955, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5992, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0815, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0875, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1690, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4993, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6751, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1996, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2883, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4948, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4986, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0849, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4835, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0879, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1918, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3999, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0886, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0852, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9928, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1848, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0985, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0690, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2736, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9898, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0873, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1919, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3973, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6969, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0919, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0877, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3982, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0784, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0771, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1873, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0830, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0906, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0956, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1834, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0886, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0870, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1944, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1771, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1928, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0730, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1916, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2900, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1995, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0839, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3949, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0944, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0928, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5938, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2737, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4968, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4982, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1963, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1920, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0853, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0924, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0830, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0839, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1883, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5888, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5862, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6952, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9903, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1874, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0897, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4881, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2955, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1955, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4846, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1742, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4852, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1988, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1777, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0818, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0808, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0803, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0638, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0898, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0917, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4737, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0920, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1784, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0946, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3998, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0942, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0860, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2873, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6991, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0886, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0961, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1863, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0920, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5834, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2849, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0889, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4782, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0848, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3990, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0870, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5801, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2961, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2660, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0979, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4824, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0737, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1873, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0772, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2821, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0637, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4762, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0973, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8846, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2771, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0771, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1821, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0857, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0912, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1987, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0940, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0938, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0955, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8917, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0979, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0979, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0921, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0875, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0908, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0891, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0979, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0998, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4873, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1940, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1972, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0796, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4637, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2921, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2733, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1888, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0660, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1800, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0730, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0960, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0990, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0752, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4833, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6973, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0912, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0986, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0839, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1943, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0914, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0942, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5863, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1260, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 3---------------
Evaluating
				 {'precision': {'supports': 0.9518796992481203, 'contradicts': 0.4774774774774775, 'parts_of_same': 0.6538461538461539}, 'recall': {'supports': 0.788293897882939, 'contradicts': 0.6794871794871795, 'parts_of_same': 0.918918918918919}, 'f1': {'supports': 0.8623978201634878, 'contradicts': 0.5608465608465608, 'parts_of_same': 0.7640449438202248}, 'support': {'supports': 803, 'contradicts': 78, 'parts_of_same': 259}, 'micro_avg': {'precision': 0.8105263157894737, 'recall': 0.8105263157894737, 'f1': 0.8105263157894737, 'support': None}, 'macro_avg': {'precision': 0.6944011101905838, 'recall': 0.7955666654296792, 'f1': 0.7290964416100912, 'support': None}, 'weighted_avg': {'precision': 0.8517094698119628, 'recall': 0.8105263157894737, 'f1': 0.8194202822690796, 'support': None}}
Loss: tensor(0.1073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0989, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0955, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0976, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0939, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9575, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0915, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0903, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0923, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0758, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0752, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0806, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0972, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2943, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0926, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2806, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0937, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1803, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0918, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0963, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1923, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2936, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2982, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1925, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2820, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1000, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1867, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0919, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5955, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1979, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0924, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0733, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0676, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1000, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1928, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0996, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1687, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0952, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0945, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5941, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0873, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2972, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0998, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0891, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1857, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8803, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0730, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3837, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1953, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4758, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0994, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0877, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0853, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0912, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1969, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1930, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2886, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0870, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1930, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0877, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3945, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1860, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0898, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0863, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0815, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1819, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0937, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0736, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1962, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0857, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0833, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0879, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1833, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0762, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1931, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2965, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0835, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0866, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1830, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0987, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2772, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3824, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0835, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0951, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0866, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0676, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4912, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0877, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5944, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0883, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6928, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4943, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0860, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0986, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2873, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1848, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0830, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0800, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0737, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1976, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3982, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1963, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4878, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1941, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1939, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0679, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0887, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3835, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5815, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0846, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2898, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0777, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1931, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0782, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8934, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2873, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8818, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9909, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6830, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0898, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1998, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0849, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0793, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0904, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0890, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0980, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4898, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2967, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0690, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4751, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5767, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0971, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0837, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1764, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1981, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0716, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3777, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2637, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0992, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3777, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0835, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0940, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1716, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0898, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0820, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1796, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0824, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0737, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5994, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3961, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1638, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1787, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0979, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1848, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5936, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3915, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1953, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0879, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2860, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0934, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0971, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6886, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0883, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0767, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0820, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0878, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0777, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2130, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 4---------------
Evaluating
				 {'precision': {'supports': 0.9167701863354037, 'contradicts': 0.611764705882353, 'parts_of_same': 0.824}, 'recall': {'supports': 0.917910447761194, 'contradicts': 0.6753246753246753, 'parts_of_same': 0.7953667953667953}, 'f1': {'supports': 0.9173399627097576, 'contradicts': 0.6419753086419754, 'parts_of_same': 0.8094302554027504}, 'support': {'supports': 804, 'contradicts': 77, 'parts_of_same': 259}, 'micro_avg': {'precision': 0.8736842105263158, 'recall': 0.8736842105263158, 'f1': 0.8736842105263158, 'support': None}, 'macro_avg': {'precision': 0.7841782974059188, 'recall': 0.7962006394842215, 'f1': 0.7895818422514944, 'support': None}, 'weighted_avg': {'precision': 0.8750922036549174, 'recall': 0.8736842105263158, 'f1': 0.8742244429240259, 'support': None}}
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0982, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8959, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0942, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4972, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9925, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0818, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4991, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2956, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1935, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0963, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2830, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0747, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1933, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6771, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3857, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9994, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0818, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0660, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0834, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0897, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0975, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0730, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3784, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5885, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3946, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1879, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7917, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0767, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2958, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3782, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3904, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0953, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3963, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2747, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0815, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1911, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2834, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2911, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0777, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7638, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5998, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0803, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0575, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0777, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0982, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0943, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0873, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0956, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6575, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7917, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3771, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0920, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0968, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0944, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6575, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0820, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2938, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1952, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0687, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0916, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5000, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5986, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1806, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1857, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0971, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5954, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0896, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0730, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4739, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0949, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2973, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1820, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0928, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8800, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1716, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 5---------------
Evaluating
				 {'precision': {'supports': 0.9366906474820144, 'contradicts': 0.5181818181818182, 'parts_of_same': 0.6746268656716418}, 'recall': {'supports': 0.8107098381070984, 'contradicts': 0.7307692307692307, 'parts_of_same': 0.8725868725868726}, 'f1': {'supports': 0.8691588785046729, 'contradicts': 0.6063829787234042, 'parts_of_same': 0.7609427609427609}, 'support': {'supports': 803, 'contradicts': 78, 'parts_of_same': 259}, 'micro_avg': {'precision': 0.8192982456140351, 'recall': 0.8192982456140351, 'f1': 0.8192982456140351, 'support': None}, 'macro_avg': {'precision': 0.7098331104451581, 'recall': 0.8046886471544005, 'f1': 0.7454948727236127, 'support': None}, 'weighted_avg': {'precision': 0.8485167806624513, 'recall': 0.8192982456140351, 'f1': 0.8265935323367131, 'support': None}}
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5941, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1987, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0784, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0789, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2916, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0637, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3903, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0801, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9980, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0803, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9996, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2917, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0997, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3758, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0800, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0903, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0995, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0990, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1972, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0972, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1940, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0777, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3996, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0806, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0956, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0751, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5976, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0971, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4839, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2736, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3910, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0985, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0923, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1796, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0730, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1947, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1987, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0819, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9934, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3878, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0777, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0891, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7793, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0818, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1764, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0959, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3912, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0940, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1931, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0881, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0794, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0889, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0993, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2906, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0789, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3955, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3784, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5815, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 6---------------
Evaluating
				 {'precision': {'supports': 0.9094387755102041, 'contradicts': 0.6666666666666666, 'parts_of_same': 0.7448275862068966}, 'recall': {'supports': 0.887920298879203, 'contradicts': 0.5641025641025641, 'parts_of_same': 0.833976833976834}, 'f1': {'supports': 0.8985507246376812, 'contradicts': 0.611111111111111, 'parts_of_same': 0.7868852459016394}, 'support': {'supports': 803, 'contradicts': 78, 'parts_of_same': 259}, 'micro_avg': {'precision': 0.8535087719298246, 'recall': 0.8535087719298246, 'f1': 0.8535087719298247, 'support': None}, 'macro_avg': {'precision': 0.7736443427945892, 'recall': 0.7619998989862004, 'f1': 0.7655156938834772, 'support': None}, 'weighted_avg': {'precision': 0.8554295452300703, 'recall': 0.8535087719298246, 'f1': 0.853514190560745, 'support': None}}
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2919, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2885, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1833, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0687, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2968, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1752, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7992, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8887, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0931, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6939, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0835, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0800, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0800, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0801, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0951, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1000, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(10.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1958, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1751, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1679, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0904, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0976, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7906, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0873, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0993, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3870, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3849, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3989, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0767, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0900, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4889, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1892, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0716, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3985, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0881, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1888, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0875, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4937, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0892, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0815, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1867, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0848, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1771, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1938, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0690, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1848, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7998, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0931, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2852, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0833, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0837, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 7---------------
Evaluating
				 {'precision': {'supports': 0.9119897959183674, 'contradicts': 0.7692307692307693, 'parts_of_same': 0.7335526315789473}, 'recall': {'supports': 0.8904109589041096, 'contradicts': 0.5128205128205128, 'parts_of_same': 0.861003861003861}, 'f1': {'supports': 0.9010712035286704, 'contradicts': 0.6153846153846154, 'parts_of_same': 0.7921847246891651}, 'support': {'supports': 803, 'contradicts': 78, 'parts_of_same': 259}, 'micro_avg': {'precision': 0.8578947368421053, 'recall': 0.8578947368421053, 'f1': 0.8578947368421053, 'support': None}, 'macro_avg': {'precision': 0.8049243989093613, 'recall': 0.7547451109094944, 'f1': 0.7695468478674835, 'support': None}, 'weighted_avg': {'precision': 0.861682401492453, 'recall': 0.8578947368421053, 'f1': 0.8567859825684352, 'support': None}}
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0730, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4965, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2996, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1782, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2940, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0885, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4972, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0676, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4904, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3883, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1952, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1904, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3660, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3961, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3857, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6742, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0947, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5981, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0919, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0793, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2000, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0979, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3733, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6881, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4896, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2943, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0923, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0687, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0637, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0957, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0896, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7916, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2951, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1923, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0912, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1853, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0951, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0917, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0862, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0957, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9972, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0889, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4965, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1939, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1968, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0992, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1830, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0904, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0866, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 8---------------
Evaluating
				 {'precision': {'supports': 0.9015795868772782, 'contradicts': 0.7192982456140351, 'parts_of_same': 0.8076923076923077}, 'recall': {'supports': 0.9240348692403487, 'contradicts': 0.5256410256410257, 'parts_of_same': 0.8108108108108109}, 'f1': {'supports': 0.9126691266912669, 'contradicts': 0.6074074074074075, 'parts_of_same': 0.809248554913295}, 'support': {'supports': 803, 'contradicts': 78, 'parts_of_same': 259}, 'micro_avg': {'precision': 0.8710526315789474, 'recall': 0.8710526315789474, 'f1': 0.8710526315789474, 'support': None}, 'macro_avg': {'precision': 0.8095233800612069, 'recall': 0.7534955685640617, 'f1': 0.7764416963373231, 'support': None}, 'weighted_avg': {'precision': 0.8677771746602254, 'recall': 0.8710526315789474, 'f1': 0.8682863703801829, 'support': None}}
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0937, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4741, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0906, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0840, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4310e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0860, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0881, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0835, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0848, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0885, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2960, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0789, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0875, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3716, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0863, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4930, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2693, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2955, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1867, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2939, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0800, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1992, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2805, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3849, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5939, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4867, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3835, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9890, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4982, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8980, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2959, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1918, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0900, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0821, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3690, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1800, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7890, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0955, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3801, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 9---------------
Evaluating
				 {'precision': {'supports': 0.9117647058823529, 'contradicts': 0.6851851851851852, 'parts_of_same': 0.8148148148148148}, 'recall': {'supports': 0.9265255292652553, 'contradicts': 0.47435897435897434, 'parts_of_same': 0.8494208494208494}, 'f1': {'supports': 0.9190858554663373, 'contradicts': 0.5606060606060607, 'parts_of_same': 0.831758034026465}, 'support': {'supports': 803, 'contradicts': 78, 'parts_of_same': 259}, 'micro_avg': {'precision': 0.8780701754385964, 'recall': 0.8780701754385964, 'f1': 0.8780701754385964, 'support': None}, 'macro_avg': {'precision': 0.8039215686274509, 'recall': 0.7501017843483596, 'f1': 0.7704833166996209, 'support': None}, 'weighted_avg': {'precision': 0.8742355616710622, 'recall': 0.8780701754385964, 'f1': 0.8747180223505228, 'support': None}}
Loss: tensor(1.8554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3967, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1962, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0741, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0679, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0801, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2819, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1834, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1737, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1767, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0737, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0981, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0927, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2789, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5870, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0962, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0924, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6955, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1889, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4940, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7943, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1877, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3405e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0900, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1926, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2988, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1976, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6995, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 10---------------
Evaluating
				 {'precision': {'supports': 0.8595505617977528, 'contradicts': 0.6811594202898551, 'parts_of_same': 0.8895027624309392}, 'recall': {'supports': 0.9526774595267746, 'contradicts': 0.6025641025641025, 'parts_of_same': 0.6216216216216216}, 'f1': {'supports': 0.9037212049616066, 'contradicts': 0.6394557823129252, 'parts_of_same': 0.7318181818181818}, 'support': {'supports': 803, 'contradicts': 78, 'parts_of_same': 259}, 'micro_avg': {'precision': 0.8535087719298246, 'recall': 0.8535087719298246, 'f1': 0.8535087719298247, 'support': None}, 'macro_avg': {'precision': 0.8100709148395157, 'recall': 0.7256210612374995, 'f1': 0.7583317230309046, 'support': None}, 'weighted_avg': {'precision': 0.8541497819086118, 'recall': 0.8535087719298246, 'f1': 0.8465847260486731, 'support': None}}
Loss: tensor(4.0799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3923, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0885, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0800, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1575, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0830, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1736, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0897, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1742, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6936, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5730, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3767e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0834, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0575, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0874, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0575, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0886, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3857, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1953, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6996, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0805, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2913, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2867, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0716, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1945, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0806, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1315, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 11---------------
Evaluating
				 {'precision': {'supports': 0.9298998569384835, 'contradicts': 0.6521739130434783, 'parts_of_same': 0.6075949367088608}, 'recall': {'supports': 0.8084577114427861, 'contradicts': 0.38461538461538464, 'parts_of_same': 0.9302325581395349}, 'f1': {'supports': 0.8649367930805056, 'contradicts': 0.4838709677419355, 'parts_of_same': 0.7350689127105666}, 'support': {'supports': 804, 'contradicts': 78, 'parts_of_same': 258}, 'micro_avg': {'precision': 0.8070175438596491, 'recall': 0.8070175438596491, 'f1': 0.8070175438596491, 'support': None}, 'macro_avg': {'precision': 0.7298895688969408, 'recall': 0.7077685513992352, 'f1': 0.6946255578443359, 'support': None}, 'weighted_avg': {'precision': 0.8379548630410685, 'recall': 0.8070175438596491, 'f1': 0.8094727163157225, 'support': None}}
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7878, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0679, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0873, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9733, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0767, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0955, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0913, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1926, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5993, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0737, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0923, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0889, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1848, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0942, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3877, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0817, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2787, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0947, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5946, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1927, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1997, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2908, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5968, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1733, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0793, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0912, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2887, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0637, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0935, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0794, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0819, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1969, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1923, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1939, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2992, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3904, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2274e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 12---------------
Evaluating
				 {'precision': {'supports': 0.910757946210269, 'contradicts': 0.7166666666666667, 'parts_of_same': 0.8320610687022901}, 'recall': {'supports': 0.9277708592777086, 'contradicts': 0.5512820512820513, 'parts_of_same': 0.8416988416988417}, 'f1': {'supports': 0.919185687847008, 'contradicts': 0.6231884057971016, 'parts_of_same': 0.836852207293666}, 'support': {'supports': 803, 'contradicts': 78, 'parts_of_same': 259}, 'micro_avg': {'precision': 0.8824561403508772, 'recall': 0.8824561403508772, 'f1': 0.8824561403508772, 'support': None}, 'macro_avg': {'precision': 0.8198285605264086, 'recall': 0.7735839174195339, 'f1': 0.7930754336459253, 'support': None}, 'weighted_avg': {'precision': 0.8795986382462624, 'recall': 0.8824561403508772, 'f1': 0.8802276532301586, 'support': None}}
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0857, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0815, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0995, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0819, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8931, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0638, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2956, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0957, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2857, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0996, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0962, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0927, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4310e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5439e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9558e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0874, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 13---------------
Evaluating
				 {'precision': {'supports': 0.9144316730523627, 'contradicts': 0.7272727272727273, 'parts_of_same': 0.7380191693290735}, 'recall': {'supports': 0.8916562889165629, 'contradicts': 0.41025641025641024, 'parts_of_same': 0.8918918918918919}, 'f1': {'supports': 0.9029003783102144, 'contradicts': 0.5245901639344261, 'parts_of_same': 0.8076923076923077}, 'support': {'supports': 803, 'contradicts': 78, 'parts_of_same': 259}, 'micro_avg': {'precision': 0.8587719298245614, 'recall': 0.8587719298245614, 'f1': 0.8587719298245614, 'support': None}, 'macro_avg': {'precision': 0.7932411898847213, 'recall': 0.7312681970216216, 'f1': 0.7450609499789828, 'support': None}, 'weighted_avg': {'precision': 0.8615463781092545, 'recall': 0.8587719298245614, 'f1': 0.8553853897037677, 'support': None}}
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3673e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6963, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2794, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1742, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1928, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2840, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4935, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(11.6509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0808, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1800, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0951, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1955, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2771, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1815, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8848, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0741, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2941, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2953, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0951, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0892, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3924, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2975, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4693, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1924, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4835, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1976, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7931, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7939, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0957, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8878, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1963, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1818, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1840, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1575, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0972, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 14---------------
Evaluating
				 {'precision': {'supports': 0.9106699751861043, 'contradicts': 0.6164383561643836, 'parts_of_same': 0.8237547892720306}, 'recall': {'supports': 0.9129353233830846, 'contradicts': 0.5769230769230769, 'parts_of_same': 0.8333333333333334}, 'f1': {'supports': 0.9118012422360249, 'contradicts': 0.5960264900662252, 'parts_of_same': 0.8285163776493256}, 'support': {'supports': 804, 'contradicts': 78, 'parts_of_same': 258}, 'micro_avg': {'precision': 0.8719298245614036, 'recall': 0.8719298245614036, 'f1': 0.8719298245614036, 'support': None}, 'macro_avg': {'precision': 0.7836210402075062, 'recall': 0.7743972445464983, 'f1': 0.7787813699838586, 'support': None}, 'weighted_avg': {'precision': 0.8708680591777489, 'recall': 0.8719298245614036, 'f1': 0.8713469214179435, 'support': None}}
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4923, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1818, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3916, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1777, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0933, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4987, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3969, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2879, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0796, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4898, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0985, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0835, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4891, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2885, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0860, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7953, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0994, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3860, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1821, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0988, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3878, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4989, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1903, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3937, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7889, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0973, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0917, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0873, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0834, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0834, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0952, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0967, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0794, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3959, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1846, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1928, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2990, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0967, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3637, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0900, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0949, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0928, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2821, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0846, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1796, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 15---------------
Evaluating
				 {'precision': {'supports': 0.922979797979798, 'contradicts': 0.6125, 'parts_of_same': 0.8208955223880597}, 'recall': {'supports': 0.9092039800995025, 'contradicts': 0.6282051282051282, 'parts_of_same': 0.8527131782945736}, 'f1': {'supports': 0.9160401002506267, 'contradicts': 0.620253164556962, 'parts_of_same': 0.8365019011406843}, 'support': {'supports': 804, 'contradicts': 78, 'parts_of_same': 258}, 'micro_avg': {'precision': 0.8771929824561403, 'recall': 0.8771929824561403, 'f1': 0.8771929824561403, 'support': None}, 'macro_avg': {'precision': 0.7854584401226193, 'recall': 0.7967074288664016, 'f1': 0.7909317219827576, 'support': None}, 'weighted_avg': {'precision': 0.8786331599577868, 'recall': 0.8771929824561403, 'f1': 0.8778012964309152, 'support': None}}
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0862, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3767e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4129e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3733, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5903, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0965, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1915, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3720, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0981, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3972, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3920, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0803, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1915, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1943, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0979, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5878, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1960, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0575, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 16---------------
Evaluating
				 {'precision': {'supports': 0.9134734239802225, 'contradicts': 0.5955056179775281, 'parts_of_same': 0.8553719008264463}, 'recall': {'supports': 0.9202988792029888, 'contradicts': 0.6794871794871795, 'parts_of_same': 0.7992277992277992}, 'f1': {'supports': 0.9168734491315137, 'contradicts': 0.6347305389221557, 'parts_of_same': 0.8263473053892216}, 'support': {'supports': 803, 'contradicts': 78, 'parts_of_same': 259}, 'micro_avg': {'precision': 0.8763157894736842, 'recall': 0.8763157894736842, 'f1': 0.8763157894736842, 'support': None}, 'macro_avg': {'precision': 0.7881169809280656, 'recall': 0.7996712859726558, 'f1': 0.7926504311476302, 'support': None}, 'weighted_avg': {'precision': 0.8785174736600134, 'recall': 0.8763157894736842, 'f1': 0.8770020296353878, 'support': None}}
Loss: tensor(3.0265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4310e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(12.1876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2954, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0939, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4870, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0787, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2874, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1965, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0575, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0784, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2972, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4967, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2934, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5914, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0946, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 17---------------
Evaluating
				 {'precision': {'supports': 0.9135338345864662, 'contradicts': 0.6153846153846154, 'parts_of_same': 0.8068181818181818}, 'recall': {'supports': 0.9078455790784558, 'contradicts': 0.6153846153846154, 'parts_of_same': 0.8223938223938224}, 'f1': {'supports': 0.910680824484697, 'contradicts': 0.6153846153846154, 'parts_of_same': 0.81453154875717}, 'support': {'supports': 803, 'contradicts': 78, 'parts_of_same': 259}, 'micro_avg': {'precision': 0.868421052631579, 'recall': 0.868421052631579, 'f1': 0.868421052631579, 'support': None}, 'macro_avg': {'precision': 0.7785788772630878, 'recall': 0.7818746722856312, 'f1': 0.7801989962088275, 'support': None}, 'weighted_avg': {'precision': 0.8688891037402119, 'recall': 0.868421052631579, 'f1': 0.86863190630642, 'support': None}}
Loss: tensor(7.2084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4896e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0916, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9863, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4491e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1923, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4975, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1941, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9015e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0881, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0830, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4353e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7024e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1912, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4741, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0789, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3979, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0985, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3890, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1794, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0782, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1762, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6885, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0954, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2898, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0982, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7939, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7986, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0789, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1867, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 18---------------
Evaluating
				 {'precision': {'supports': 0.9363762102351314, 'contradicts': 0.452991452991453, 'parts_of_same': 0.7566666666666667}, 'recall': {'supports': 0.8430884184308842, 'contradicts': 0.6794871794871795, 'parts_of_same': 0.8764478764478765}, 'f1': {'supports': 0.8872870249017037, 'contradicts': 0.5435897435897437, 'parts_of_same': 0.8121645796064402}, 'support': {'supports': 803, 'contradicts': 78, 'parts_of_same': 259}, 'micro_avg': {'precision': 0.8394736842105263, 'recall': 0.8394736842105263, 'f1': 0.8394736842105263, 'support': None}, 'macro_avg': {'precision': 0.7153447766310838, 'recall': 0.7996744914553133, 'f1': 0.7476804493659626, 'support': None}, 'weighted_avg': {'precision': 0.8624737691393075, 'recall': 0.8394736842105263, 'f1': 0.8467036027316984, 'support': None}}
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0960, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8472e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4967, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0716, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6163e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0971, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2949e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0730, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8697e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1771, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7249e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6525e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7068e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4353e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1846, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0945, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9920e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5982e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9554e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3873, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0772, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8244e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1942, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5908, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1758, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5439e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0830, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6128e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 19---------------
Evaluating
				 {'precision': {'supports': 0.8747044917257684, 'contradicts': 0.589041095890411, 'parts_of_same': 0.832579185520362}, 'recall': {'supports': 0.9203980099502488, 'contradicts': 0.5512820512820513, 'parts_of_same': 0.7131782945736435}, 'f1': {'supports': 0.896969696969697, 'contradicts': 0.5695364238410597, 'parts_of_same': 0.768267223382046}, 'support': {'supports': 804, 'contradicts': 78, 'parts_of_same': 258}, 'micro_avg': {'precision': 0.8482456140350877, 'recall': 0.8482456140350877, 'f1': 0.8482456140350877, 'support': None}, 'macro_avg': {'precision': 0.7654415910455138, 'recall': 0.7282861186019812, 'f1': 0.7449244480642676, 'support': None}, 'weighted_avg': {'precision': 0.8456254795537045, 'recall': 0.8482456140350877, 'f1': 0.845438965838427, 'support': None}}
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0919, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8653e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8154e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1593e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0955, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7430e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0904, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4940e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6163e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9059e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3311e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9920e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2044e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5394e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5213e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8878e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1630e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 20---------------
Evaluating
				 {'precision': {'supports': 0.8834720570749108, 'contradicts': 0.6231884057971014, 'parts_of_same': 0.8304347826086956}, 'recall': {'supports': 0.925280199252802, 'contradicts': 0.5512820512820513, 'parts_of_same': 0.7374517374517374}, 'f1': {'supports': 0.9038929440389294, 'contradicts': 0.5850340136054423, 'parts_of_same': 0.7811860940695297}, 'support': {'supports': 803, 'contradicts': 78, 'parts_of_same': 259}, 'micro_avg': {'precision': 0.8570175438596491, 'recall': 0.8570175438596491, 'f1': 0.8570175438596491, 'support': None}, 'macro_avg': {'precision': 0.7790317484935693, 'recall': 0.7380046626621969, 'f1': 0.7567043505713004, 'support': None}, 'weighted_avg': {'precision': 0.8536134791043679, 'recall': 0.8570175438596491, 'f1': 0.8541981451653446, 'support': None}}
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0869e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8516e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7024e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0507e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4216e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5801e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1774e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6569e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4129e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5845e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7792e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4172e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9015e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5801e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0821e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2269e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7969e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0145e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4759e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3492e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4353e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7249e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5483e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4578e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3854e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 21---------------
Evaluating
				 {'precision': {'supports': 0.8827014218009479, 'contradicts': 0.6363636363636364, 'parts_of_same': 0.8304347826086956}, 'recall': {'supports': 0.9277708592777086, 'contradicts': 0.5384615384615384, 'parts_of_same': 0.7374517374517374}, 'f1': {'supports': 0.9046751669702489, 'contradicts': 0.5833333333333334, 'parts_of_same': 0.7811860940695297}, 'support': {'supports': 803, 'contradicts': 78, 'parts_of_same': 259}, 'micro_avg': {'precision': 0.8578947368421053, 'recall': 0.8578947368421053, 'f1': 0.8578947368421053, 'support': None}, 'macro_avg': {'precision': 0.7831666135910932, 'recall': 0.7345613783969949, 'f1': 0.7563981981243707, 'support': None}, 'weighted_avg': {'precision': 0.8539721175773483, 'recall': 0.8578947368421053, 'f1': 0.8546327696851912, 'support': None}}
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4489e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4715e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2044e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0145e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2498e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3130e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5302e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4353e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0640e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7655e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7249e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2406e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0459e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7792e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2317e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0640e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4489e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4216e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8653e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2860e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9916e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3311e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2406e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4578e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7973e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4489e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4715e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4715e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2587e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0278e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0459e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5801e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7249e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5968e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 22---------------
Evaluating
				 {'precision': {'supports': 0.8837485172004745, 'contradicts': 0.6307692307692307, 'parts_of_same': 0.8275862068965517}, 'recall': {'supports': 0.9266169154228856, 'contradicts': 0.5324675324675324, 'parts_of_same': 0.7413127413127413}, 'f1': {'supports': 0.904675166970249, 'contradicts': 0.5774647887323944, 'parts_of_same': 0.7820773930753564}, 'support': {'supports': 804, 'contradicts': 77, 'parts_of_same': 259}, 'micro_avg': {'precision': 0.8578947368421053, 'recall': 0.8578947368421053, 'f1': 0.8578947368421053, 'support': None}, 'macro_avg': {'precision': 0.7807013182887523, 'recall': 0.7334657297343864, 'f1': 0.7547391162593332, 'support': None}, 'weighted_avg': {'precision': 0.853901637004052, 'recall': 0.8578947368421053, 'f1': 0.8547207612131508, 'support': None}}
Loss: tensor(1.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9015e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8693e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5982e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9916e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2860e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5982e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4759e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3765e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2317e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2088e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4825e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2949e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7068e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3673e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2768e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3673e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8653e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5302e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8472e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4940e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1231e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5258e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2136e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1545e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6203e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9558e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7746e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0640e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2225e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1412e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4940e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0145e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2406e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5394e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1320e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4715e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8512e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9940e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0459e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3094e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3130e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4491e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8452e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4940e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7973e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3222e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6642e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2406e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6978e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 23---------------
Evaluating
				 {'precision': {'supports': 0.8846611177170036, 'contradicts': 0.6363636363636364, 'parts_of_same': 0.8240343347639485}, 'recall': {'supports': 0.9265255292652553, 'contradicts': 0.5384615384615384, 'parts_of_same': 0.7413127413127413}, 'f1': {'supports': 0.9051094890510949, 'contradicts': 0.5833333333333334, 'parts_of_same': 0.7804878048780487}, 'support': {'supports': 803, 'contradicts': 78, 'parts_of_same': 259}, 'micro_avg': {'precision': 0.8578947368421053, 'recall': 0.8578947368421053, 'f1': 0.8578947368421053, 'support': None}, 'macro_avg': {'precision': 0.7816863629481962, 'recall': 0.735433269679845, 'f1': 0.7563102090874922, 'support': None}, 'weighted_avg': {'precision': 0.8538983630412106, 'recall': 0.8578947368421053, 'f1': 0.8547800536591612, 'support': None}}
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6525e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7112e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8516e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2225e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3130e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6207e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2406e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1319e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1794e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6388e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6022e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6092e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4534e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9735e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6648e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9509e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7430e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1320e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2136e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6022e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9147e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7238e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0459e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5690e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1593e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7293e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5664e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7304e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6022e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0006e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9565e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0308e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5483e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4308e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9366e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6931e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1125e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1059e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6384e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5743e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9450e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9554e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8809e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2768e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7366e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9461e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8759e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3123e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5304e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3492e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 24---------------
Evaluating
				 {'precision': {'supports': 0.8866348448687351, 'contradicts': 0.6363636363636364, 'parts_of_same': 0.8220338983050848}, 'recall': {'supports': 0.925280199252802, 'contradicts': 0.5384615384615384, 'parts_of_same': 0.749034749034749}, 'f1': {'supports': 0.9055453991468618, 'contradicts': 0.5833333333333334, 'parts_of_same': 0.7838383838383839}, 'support': {'supports': 803, 'contradicts': 78, 'parts_of_same': 259}, 'micro_avg': {'precision': 0.8587719298245614, 'recall': 0.8587719298245614, 'f1': 0.8587719298245614, 'support': None}, 'macro_avg': {'precision': 0.7816774598458188, 'recall': 0.7375921622496965, 'f1': 0.7575723721061931, 'support': None}, 'weighted_avg': {'precision': 0.8548341436201534, 'recall': 0.8587719298245614, 'f1': 0.8558483306395364, 'support': None}}
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6207e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2224e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6410e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6022e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7746e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2037e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3796e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0549e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6984e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9871e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3547e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2505e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8953e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8653e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8017e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6207e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9282e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0233e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9571e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1085e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2673e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8966e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2847e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4295e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0459e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7969e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6178e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4216e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8410e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0278e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8379e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8255e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6397e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2498e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4759e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9916e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2313e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6114e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2450e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4289e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3525e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8805e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0271e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4666e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1412e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3487e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7969e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2949e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8533e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7655e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5927e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6037e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7200e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3765e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6549e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3492e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7257e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6776e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8074e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9516e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4436e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5328e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6461e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6838e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6218e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2655e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1690e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6554e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6595e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4686e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8017e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9505e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2498e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0869e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2399e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4216e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2130e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4664e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7452e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1774e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6657e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7353e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7079e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8331e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3063e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8425e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9899e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 25---------------
Evaluating
				 {'precision': {'supports': 0.8864994026284349, 'contradicts': 0.6363636363636364, 'parts_of_same': 0.8185654008438819}, 'recall': {'supports': 0.9240348692403487, 'contradicts': 0.5384615384615384, 'parts_of_same': 0.749034749034749}, 'f1': {'supports': 0.9048780487804877, 'contradicts': 0.5833333333333334, 'parts_of_same': 0.782258064516129}, 'support': {'supports': 803, 'contradicts': 78, 'parts_of_same': 259}, 'micro_avg': {'precision': 0.8578947368421053, 'recall': 0.8578947368421053, 'f1': 0.8578947368421053, 'support': None}, 'macro_avg': {'precision': 0.7804761466119844, 'recall': 0.7371770522455453, 'f1': 0.75682314887665, 'support': None}, 'weighted_avg': {'precision': 0.8539507217241774, 'recall': 0.8578947368421053, 'f1': 0.8550192209477272, 'support': None}}
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2406e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7969e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5512e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6158e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1896e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8163e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1394e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7821e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4962e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4990e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8686e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4370e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2311e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3854e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0851e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4308e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0145e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1145e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4046e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4470e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9554e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0763e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5088e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1545e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1569e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5565e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1743e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6304e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8108e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3172e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9165e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3419e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4505e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6158e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1726e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5258e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1447e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6485e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8171e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8770e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2573e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5750e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6891e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8167e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2171e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5478e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6320e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3430e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4392e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9410e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7112e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2776e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8624e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1858e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8006e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9940e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0430e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8258e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4534e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1911e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3209e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8604e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7565e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6688e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1615e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8198e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1220e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2598e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2847e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6591e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8399e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4598e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6052e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0037e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2492e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6876e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9862e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2551e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5013e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6554e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3311e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6152e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0070e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9229e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7266e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5397e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2450e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7754e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8792e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7496e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4262e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0459e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5990e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5258e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4545e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2498e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4955e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4353e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0911e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4032e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1587e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6944e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2171e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4792e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9942e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4397e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2180e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6414e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8626e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3035e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2251e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1454e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2714e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7238e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1412e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7624e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6092e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2714e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8092e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6604e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4895e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4858e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2863e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3474e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1503e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8854e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5516e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8198e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7586e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6414e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9441e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3130e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0770e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3328e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6670e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0825e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1911e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4236e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9450e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 26---------------
Evaluating
				 {'precision': {'supports': 0.8875598086124402, 'contradicts': 0.6363636363636364, 'parts_of_same': 0.819327731092437}, 'recall': {'supports': 0.9240348692403487, 'contradicts': 0.5384615384615384, 'parts_of_same': 0.752895752895753}, 'f1': {'supports': 0.9054301403294692, 'contradicts': 0.5833333333333334, 'parts_of_same': 0.7847082494969819}, 'support': {'supports': 803, 'contradicts': 78, 'parts_of_same': 259}, 'micro_avg': {'precision': 0.8587719298245614, 'recall': 0.8587719298245614, 'f1': 0.8587719298245614, 'support': None}, 'macro_avg': {'precision': 0.7810837253561712, 'recall': 0.7384640535325467, 'f1': 0.7578239077199281, 'support': None}, 'weighted_avg': {'precision': 0.8548708528992055, 'recall': 0.8587719298245614, 'f1': 0.8559647713195456, 'support': None}}
Loss: tensor(1.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8944e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5816e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3412e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3880e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1977e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0302e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6205e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0315e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4960e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8392e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0145e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4951e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2044e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7688e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2136e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1132e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6984e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4728e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4942e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8922e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2655e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8503e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6430e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5121e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5315e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3719e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3721e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4951e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3357e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2218e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0143e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2044e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7856e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6092e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2465e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0401e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5529e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8236e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6178e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0092e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0951e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2902e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9565e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6602e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3975e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1949e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5406e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8518e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8304e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3719e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6022e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2895e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6507e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2847e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6445e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4408e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0189e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9350e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5169e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1132e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9408e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6551e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7063e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4008e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9783e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2973e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8262e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8165e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1794e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4602e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0536e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1172e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7315e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6514e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8414e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8439e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9408e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2476e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3593e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7392e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8973e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7935e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8231e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2714e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7432e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5350e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4604e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0657e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9503e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1050e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4342e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8973e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6333e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8516e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5452e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9134e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3774e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0644e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6127e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3858e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5995e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6037e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3878e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6227e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8626e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0657e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9556e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9452e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1028e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4942e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1260e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8895e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7178e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8297e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7392e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6333e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7394e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2761e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4057e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3163e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8673e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3163e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2258e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8538e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3264e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7743e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5750e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6061e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1816e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4858e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1273e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7595e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0278e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8593e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1275e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3516e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9741e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4322e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0845e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2942e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9893e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0282e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9558e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7127e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9503e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5022e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7922e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6213e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5483e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7154e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3900e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0127e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8320e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7304e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5796e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1975e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3017e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5470e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3712e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2311e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5450e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6222e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0628e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7257e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6357e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8693e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5823e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4070e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9657e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7487e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3472e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7147e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8655e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9657e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7955e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5858e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9218e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4022e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5289e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0498e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4538e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3251e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7032e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4593e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9772e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1092e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6205e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6589e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8167e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2207e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1580e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4355e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5529e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5452e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3200e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9421e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5816e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3008e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 27---------------
Evaluating
				 {'precision': {'supports': 0.8875598086124402, 'contradicts': 0.6363636363636364, 'parts_of_same': 0.819327731092437}, 'recall': {'supports': 0.9240348692403487, 'contradicts': 0.5384615384615384, 'parts_of_same': 0.752895752895753}, 'f1': {'supports': 0.9054301403294692, 'contradicts': 0.5833333333333334, 'parts_of_same': 0.7847082494969819}, 'support': {'supports': 803, 'contradicts': 78, 'parts_of_same': 259}, 'micro_avg': {'precision': 0.8587719298245614, 'recall': 0.8587719298245614, 'f1': 0.8587719298245614, 'support': None}, 'macro_avg': {'precision': 0.7810837253561712, 'recall': 0.7384640535325467, 'f1': 0.7578239077199281, 'support': None}, 'weighted_avg': {'precision': 0.8548708528992055, 'recall': 0.8587719298245614, 'f1': 0.8559647713195456, 'support': None}}
Loss: tensor(6.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7648e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5207e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4251e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3549e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7571e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3862e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2792e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3244e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1743e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2361e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6273e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8311e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1353e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4041e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7251e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0370e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6569e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3004e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2127e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4032e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5353e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0289e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6951e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8216e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2211e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2439e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0452e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4624e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6900e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4013e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5439e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5262e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3534e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7289e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5225e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4946e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4105e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5765e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5222e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3697e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5425e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8693e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2507e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5628e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0730e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0061e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6604e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7205e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1737e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7973e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1238e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2313e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3019e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8445e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6728e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0664e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1412e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8289e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6105e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9578e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4498e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2869e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3887e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8224e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6022e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9224e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8646e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2156e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1474e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4249e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0911e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1220e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7085e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9556e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5127e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6171e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9044e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9516e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6348e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0589e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4779e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4103e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2406e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9531e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9041e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1353e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6538e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2895e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9783e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3070e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8922e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8030e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9949e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6439e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1454e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9218e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9909e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4417e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6258e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2046e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9405e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8061e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7425e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5454e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3893e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2801e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3320e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0103e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1796e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3026e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9141e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9565e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2949e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3545e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6854e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2092e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8838e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4222e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5615e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5357e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3545e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4417e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0549e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7432e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6465e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0390e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8726e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4772e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3209e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0379e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5394e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4032e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1447e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9017e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4670e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4114e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5452e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8673e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4498e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4035e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8304e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1569e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0052e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6207e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8304e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5403e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6185e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2869e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0443e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7792e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4242e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3878e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2474e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1472e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6763e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2094e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2527e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9141e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5651e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3854e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9487e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3352e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4417e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9147e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6485e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9871e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1622e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3350e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8423e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0004e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4604e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5823e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7430e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3130e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0266e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6673e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6052e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9154e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2821e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5988e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9147e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4059e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2317e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1715e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1525e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4430e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3975e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6863e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1273e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9251e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8423e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4624e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0436e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9022e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6719e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1655e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1684e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7962e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3227e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8693e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8130e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7809e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8348e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8013e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0189e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7244e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4973e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8693e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8491e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5258e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1635e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0536e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7211e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1871e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1324e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8626e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6167e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9116e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1171e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8465e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3216e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8077e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5646e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1962e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7602e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6885e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2730e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3050e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8258e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8375e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9759e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0322e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6514e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1977e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1443e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5322e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5368e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0447e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7628e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6763e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1066e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9578e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1112e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2346e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0805e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9845e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7304e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2695e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8331e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3154e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6015e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0180e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4059e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5470e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6127e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1533e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9551e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4430e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3008e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0891e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3765e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1057e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8516e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5642e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1533e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5622e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5999e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3154e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3527e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5845e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 28---------------
Evaluating
				 {'precision': {'supports': 0.888622754491018, 'contradicts': 0.6363636363636364, 'parts_of_same': 0.8200836820083682}, 'recall': {'supports': 0.9240348692403487, 'contradicts': 0.5384615384615384, 'parts_of_same': 0.7567567567567568}, 'f1': {'supports': 0.9059829059829061, 'contradicts': 0.5833333333333334, 'parts_of_same': 0.7871485943775102}, 'support': {'supports': 803, 'contradicts': 78, 'parts_of_same': 259}, 'micro_avg': {'precision': 0.8596491228070176, 'recall': 0.8596491228070176, 'f1': 0.8596491228070176, 'support': None}, 'macro_avg': {'precision': 0.7816900242876742, 'recall': 0.7397510548195481, 'f1': 0.7588216112312498, 'support': None}, 'weighted_avg': {'precision': 0.855791323800718, 'recall': 0.8596491228070176, 'f1': 0.856908560919341, 'support': None}}
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0785e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6723e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0558e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9496e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3697e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0103e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2171e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1635e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7977e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1706e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6218e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6176e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7225e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1381e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6361e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8242e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0785e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9198e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2101e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9880e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8017e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8436e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5642e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3706e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2044e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9624e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7425e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3251e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0266e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3046e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5348e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4545e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9551e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2094e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9304e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7447e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9969e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5990e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9008e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3781e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1320e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4209e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5622e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4953e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6421e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4092e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0898e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9388e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9236e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0962e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7809e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9542e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7675e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4860e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9838e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9176e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7019e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8311e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8626e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3163e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1858e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7670e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2913e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6951e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0898e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4390e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1019e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2295e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6273e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8779e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6127e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2726e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3646e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3955e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1447e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5851e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0655e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4483e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7653e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2666e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9712e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8827e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9441e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2781e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7425e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3136e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2019e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8512e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5308e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9969e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3730e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6141e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2392e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9913e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0904e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0891e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7368e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1805e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8379e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1675e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6863e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7990e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5141e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9880e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9008e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4578e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7044e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6185e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3145e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3516e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7412e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0960e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7578e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4421e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5913e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3008e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9447e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4759e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1655e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2233e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4203e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2339e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4556e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8664e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5209e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4927e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9949e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5443e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2973e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7562e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5651e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8492e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4556e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6370e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5984e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5684e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6556e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2178e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3889e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1955e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9384e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8348e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3673e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0447e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9055e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6565e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7085e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6127e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0593e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5441e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2414e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9542e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0966e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7441e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7940e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7862e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9361e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5801e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5624e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4578e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3832e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6854e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7990e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8123e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1322e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5807e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3176e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8895e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1397e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7406e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8454e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1171e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3017e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1180e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2361e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8302e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6783e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0730e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7741e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0911e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6320e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8445e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5154e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3534e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0818e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6039e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7931e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8686e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0536e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3500e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9478e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5370e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4505e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4346e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3297e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0121e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0891e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9904e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5600e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6348e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5262e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4754e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9472e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8061e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2695e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6507e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4203e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1622e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1152e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3545e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2809e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1628e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9838e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1147e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1805e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7394e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3050e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1324e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6542e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3551e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3158e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8646e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5953e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3545e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8697e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6807e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2821e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1172e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8741e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5984e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7900e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1642e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9721e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2123e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1143e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1695e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9370e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6116e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0602e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0737e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8697e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6013e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0019e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4946e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2995e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4785e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7911e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7044e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3927e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4779e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5818e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4693e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1092e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7216e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8324e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9657e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4061e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0655e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1962e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9741e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6863e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8580e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5823e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0730e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7154e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8103e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9189e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5851e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0271e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0043e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1984e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2046e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3432e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2741e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7578e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3297e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0203e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9904e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6882e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0796e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3055e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7849e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8827e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2143e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6542e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8284e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2220e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6737e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3545e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7754e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9388e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9551e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6657e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2030e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9044e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2721e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1328e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3297e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8352e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5180e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0556e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8379e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3622e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3138e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3525e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8854e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2447e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8505e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7030e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9388e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1918e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7211e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1677e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4534e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8154e-06, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 29---------------
Evaluating
				 {'precision': {'supports': 0.888755980861244, 'contradicts': 0.6363636363636364, 'parts_of_same': 0.819327731092437}, 'recall': {'supports': 0.9241293532338308, 'contradicts': 0.5384615384615384, 'parts_of_same': 0.7558139534883721}, 'f1': {'supports': 0.9060975609756097, 'contradicts': 0.5833333333333334, 'parts_of_same': 0.7862903225806451}, 'support': {'supports': 804, 'contradicts': 78, 'parts_of_same': 258}, 'micro_avg': {'precision': 0.8596491228070176, 'recall': 0.8596491228070176, 'f1': 0.8596491228070176, 'support': None}, 'macro_avg': {'precision': 0.7814824494391056, 'recall': 0.7394682817279138, 'f1': 0.758573738963196, 'support': None}, 'weighted_avg': {'precision': 0.8557743218163619, 'recall': 0.8596491228070176, 'f1': 0.8568994230264882, 'support': None}}
Loss: tensor(6.0781e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2507e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5922e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9008e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4180e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5637e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5454e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8673e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7949e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3297e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8297e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4423e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1622e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5865e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2615e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0772e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8156e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9821e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2646e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1458e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4384e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0242e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8551e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6180e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2074e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7397e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7551e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5121e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7266e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7308e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4167e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0302e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4911e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0737e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2145e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9189e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8474e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1677e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7406e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1035e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3130e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3984e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7922e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0556e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3141e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6862e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3895e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1706e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0664e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1849e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8284e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2876e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4046e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9644e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0898e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4026e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3470e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1768e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2419e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2211e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7759e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0423e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6518e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7922e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5308e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6152e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7922e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6138e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8714e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9657e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5684e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1876e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2269e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7668e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4598e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9198e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2582e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8198e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7809e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2754e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7154e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9565e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2953e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5595e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5704e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0728e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5017e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1887e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5816e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5615e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9238e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3156e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9684e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4845e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8807e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1858e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3390e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4236e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5503e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5322e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8646e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9949e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4858e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2520e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1194e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5041e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1587e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0863e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2342e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4759e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4165e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4394e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3525e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6492e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4035e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9551e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7922e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1017e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3008e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7582e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2900e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3138e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4224e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4158e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3350e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5975e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7405e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7832e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3008e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8293e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0046e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8533e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8960e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1904e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9704e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2821e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0571e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9008e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8103e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2646e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4236e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7922e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2916e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7044e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7447e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1099e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0443e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0242e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2024e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1542e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5496e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3503e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1887e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6854e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0194e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5818e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4628e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5394e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7024e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0108e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0591e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2044e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4412e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5167e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4022e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9161e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5322e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7801e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4783e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8666e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2642e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4520e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8139e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8227e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1147e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0013e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5684e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2450e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4598e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2099e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0194e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0549e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8423e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5262e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5236e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0194e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7030e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0194e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0066e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1328e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3043e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7955e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6231e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0962e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3999e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8827e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6423e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8969e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4178e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2827e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8233e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1320e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7125e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4055e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2295e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4860e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0730e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5489e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9035e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2397e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9189e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1714e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9427e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5697e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1942e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6492e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3706e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5189e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1622e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0899e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3231e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6807e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1760e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8304e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2352e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6496e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6329e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0381e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5275e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9565e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9895e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7043e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5052e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6542e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3172e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1927e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1057e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3726e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6180e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3125e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8953e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0094e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8284e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0529e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9189e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3765e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8194e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4765e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0094e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1458e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5154e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2944e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5999e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6156e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0375e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6542e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9236e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3264e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1704e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6311e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0536e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3125e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8037e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8465e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6361e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8043e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0255e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9765e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1904e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1554e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4222e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4258e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2507e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8154e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4858e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7211e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6220e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7578e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7216e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3816e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3862e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9805e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1887e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8311e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0772e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8139e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9441e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7712e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1505e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7774e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0015e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2735e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8445e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2178e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4041e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5776e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8673e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7405e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3534e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9079e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7262e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4346e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1066e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5885e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8024e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8922e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4013e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2803e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9699e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7379e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4236e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1333e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1333e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7743e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4236e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1447e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3622e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2057e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7741e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6384e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2640e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6746e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6328e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2121e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3207e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2821e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6046e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2640e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9425e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3622e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8130e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3278e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7211e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2186e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7236e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8213e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4068e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1454e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1079e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6308e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3278e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0474e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2039e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1132e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3693e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7044e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5233e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0918e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3430e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7266e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6673e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0121e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2211e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9350e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1244e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1099e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5675e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2346e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4403e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3512e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8445e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1019e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2714e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1803e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8445e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0376e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9262e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9565e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0315e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3278e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8103e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5818e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2401e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5284e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6518e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0085e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0856e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6138e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7035e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3158e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6138e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9896e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6172e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2876e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5496e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6180e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5052e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1622e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8854e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7924e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1044e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6708e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3231e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3297e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 30---------------
Evaluating
				 {'precision': {'supports': 0.8895558223289316, 'contradicts': 0.6363636363636364, 'parts_of_same': 0.8174273858921162}, 'recall': {'supports': 0.9227895392278954, 'contradicts': 0.5384615384615384, 'parts_of_same': 0.7606177606177607}, 'f1': {'supports': 0.9058679706601467, 'contradicts': 0.5833333333333334, 'parts_of_same': 0.7879999999999999}, 'support': {'supports': 803, 'contradicts': 78, 'parts_of_same': 259}, 'micro_avg': {'precision': 0.8596491228070176, 'recall': 0.8596491228070176, 'f1': 0.8596491228070176, 'support': None}, 'macro_avg': {'precision': 0.7811156148615614, 'recall': 0.7406229461023982, 'f1': 0.75906710133116, 'support': None}, 'weighted_avg': {'precision': 0.8558450718531174, 'recall': 0.8596491228070176, 'f1': 0.85702103547377, 'support': None}}
Loss: tensor(1.6824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3996e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5461e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4505e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9472e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5141e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5134e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2459e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6957e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0737e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3670e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9342e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6180e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1324e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8714e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4114e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4946e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1984e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5147e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2907e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9384e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1664e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6180e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7949e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8635e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8566e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8103e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4946e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1328e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5161e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5379e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2719e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6138e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5865e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8348e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4598e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2907e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8566e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4403e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9503e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2165e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5308e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9569e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3231e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3231e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2876e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5308e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1825e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0781e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2935e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9827e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8942e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0536e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2876e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7741e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7529e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4236e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3540e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4763e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8512e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6792e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6410e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4222e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6688e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9425e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0962e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3496e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7030e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6408e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4624e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1225e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2876e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4123e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4346e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2152e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3134e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5595e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8139e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6871e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9893e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7754e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7379e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4519e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2520e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8129e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2891e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2410e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3116e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9008e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9657e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0375e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3320e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2598e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6266e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7922e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5043e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8405e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2549e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9200e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4039e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0375e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5767e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0899e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7043e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0194e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5470e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5776e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5984e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9161e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8854e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3244e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4032e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2186e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3386e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0953e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4249e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7902e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5289e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5512e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4858e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3781e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2145e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1760e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3384e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0899e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6180e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6130e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5489e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5209e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9427e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2048e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1760e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1238e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7902e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8646e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1410e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8139e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3896e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8445e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8103e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3324e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2355e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7902e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0194e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4518e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4779e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0715e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3887e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9827e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6681e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0423e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3116e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1858e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4889e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5591e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1496e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1458e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0013e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0194e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6589e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0019e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0966e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3955e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7035e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5322e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1421e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0227e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9224e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6882e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6421e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1370e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4055e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4681e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5161e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7043e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8103e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4293e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5342e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4922e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3887e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9350e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5704e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3640e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2103e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0962e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4779e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3432e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1342e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4417e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1026e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3995e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3794e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5591e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7578e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4880e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6147e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7922e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4779e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5251e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4536e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7191e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4578e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2313e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3361e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4114e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9885e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6865e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3432e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0918e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0909e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0423e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5308e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8264e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4880e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3163e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2927e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0542e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7333e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8264e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7712e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2962e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3525e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9189e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7902e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0899e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1079e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7540e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4094e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7057e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5975e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3984e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1664e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3996e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5975e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9699e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0899e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6138e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4061e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5704e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2410e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2957e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0376e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3026e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9853e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3908e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7176e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6329e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4681e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3794e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2573e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0066e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0591e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9628e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8323e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5224e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6728e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8827e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9055e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3640e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0805e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0376e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6152e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2419e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6852e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0108e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7801e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9554e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1458e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4236e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6904e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3459e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7521e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8520e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6282e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2346e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2216e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3889e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2876e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2152e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8518e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5615e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7902e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3207e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2333e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3176e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6068e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5432e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7902e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6242e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1704e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6690e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0275e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7191e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5141e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2701e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5635e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7955e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1796e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8103e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9123e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8218e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3238e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6180e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3693e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6852e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8436e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3512e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8147e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3441e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6310e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9010e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7754e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8319e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6310e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5719e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1542e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0931e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0781e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2591e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3231e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8284e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7392e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2821e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7604e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5043e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8284e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1421e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2688e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6329e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0372e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8666e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0706e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9772e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0242e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5052e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8264e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0898e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6180e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8598e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9551e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7379e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6329e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6180e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0637e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7447e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5390e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7531e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2554e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4366e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9189e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6156e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5586e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0013e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7922e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0436e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1399e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6882e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5999e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4519e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4085e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7447e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2392e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5711e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6329e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6158e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0262e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5116e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9427e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3047e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7549e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4862e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1269e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9427e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1821e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8648e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4346e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9853e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0899e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3231e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3975e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5767e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3152e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5670e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8284e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4519e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6756e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2907e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8264e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2735e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7940e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3821e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6889e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3260e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1161e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9331e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3715e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3803e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3570e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5640e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9827e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2807e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1516e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0570e-06, device='cuda:0', grad_fn=<DivBackward0>)


		-------------RUN 4-----------
			------------EPOCH 1---------------
Evaluating
				 {'precision': {'supports': 0.7307692307692307, 'contradicts': 0.13106796116504854, 'parts_of_same': 0.1956521739130435}, 'recall': {'supports': 0.2693565976008724, 'contradicts': 0.23478260869565218, 'parts_of_same': 0.5806451612903226}, 'f1': {'supports': 0.3936254980079681, 'contradicts': 0.16822429906542055, 'parts_of_same': 0.29268292682926833}, 'support': {'supports': 917, 'contradicts': 115, 'parts_of_same': 248}, 'micro_avg': {'precision': 0.3265625, 'recall': 0.3265625, 'f1': 0.3265625, 'support': None}, 'macro_avg': {'precision': 0.35249645528244095, 'recall': 0.3615947891956157, 'f1': 0.28484424130088565, 'support': None}, 'weighted_avg': {'precision': 0.5732108900623436, 'recall': 0.3265625, 'f1': 0.3538169858746005, 'support': None}}
Loss: tensor(1.1263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4916, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3938, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0911, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3924, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1988, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3747, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2953, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9956, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2992, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7883, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5955, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2784, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5925, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4806, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5815, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3782, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1736, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1960, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2716, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8863, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0835, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3824, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5917, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4767, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3952, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1993, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1742, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3801, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2857, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3991, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7787, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2996, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2846, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6979, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2890, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5935, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2777, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2687, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4915, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8919, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1815, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5877, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6999, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1720, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5936, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5911, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1976, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7863, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3928, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2960, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3805, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3741, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4906, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2000, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7737, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1949, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3969, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2913, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5693, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1904, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3995, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4796, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0996, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1953, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3954, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1936, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5898, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7980, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1912, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1849, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7962, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4891, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6772, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4928, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5981, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0818, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1830, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0997, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8637, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0637, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0888, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0992, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8991, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4898, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3819, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2877, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1885, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4784, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4933, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1881, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1801, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3801, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1820, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1887, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8988, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1963, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1923, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9995, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4891, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1887, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3888, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1943, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0947, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2954, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1997, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6951, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0947, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9687, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1903, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3830, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1991, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0982, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3968, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1913, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2959, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1971, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9690, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4937, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1937, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0941, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4752, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3772, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1930, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1890, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4985, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1860, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4960, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5958, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8926, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6957, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1967, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0973, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4835, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0999, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8928, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1885, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0764, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0789, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8960, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0953, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0846, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2817, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0883, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1772, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2959, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1824, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1965, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1897, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8839, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3934, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0948, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0910, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1916, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0965, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2955, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1979, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2730, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4976, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1948, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8676, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0878, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9890, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7690, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1866, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1973, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1949, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2925, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0949, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1890, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9875, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1913, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2733, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1908, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4834, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2793, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4762, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0883, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2892, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2857, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5834, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0747, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8820, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2886, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1989, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1896, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1918, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4866, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1000, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2679, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1693, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2925, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3985, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3948, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2803, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2961, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3737, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4837, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2690, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2758, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2716, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0969, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6837, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0879, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1903, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0793, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6938, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1881, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0917, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1949, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0934, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2985, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2848, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3994, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5808, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0910, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7992, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4909, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6000, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0873, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5971, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0951, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3989, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2986, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6693, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8821, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1992, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0982, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0794, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0889, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2910, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0955, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2000, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4870, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2903, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0954, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2789, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1866, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2800, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2968, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0955, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2801, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0903, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2879, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0679, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0881, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3789, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6879, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1953, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0982, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0846, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0949, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1739, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1940, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4742, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0997, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0973, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3917, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9956, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0955, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0833, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0982, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1945, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0878, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1805, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5808, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6912, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1962, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0959, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5975, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2821, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1918, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0853, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1909, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6873, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1975, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0971, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0913, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1835, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2960, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5883, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2994, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4994, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0679, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9789, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1789, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8879, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1885, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2957, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1979, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0979, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0815, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0751, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7940, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0883, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1730, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1988, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5000, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9637, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1762, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7931, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2990, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1881, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0693, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4889, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0946, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1963, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0888, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9867, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3989, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1830, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0979, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2764, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6923, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4933, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3920, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0782, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0998, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6818, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0852, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2676, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1959, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0965, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0825, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 2---------------
Evaluating
				 {'precision': {'supports': 0.906721536351166, 'contradicts': 0.4482758620689655, 'parts_of_same': 0.5517241379310345}, 'recall': {'supports': 0.7208287895310797, 'contradicts': 0.7913043478260869, 'parts_of_same': 0.7741935483870968}, 'f1': {'supports': 0.8031591737545566, 'contradicts': 0.5723270440251572, 'parts_of_same': 0.6442953020134228}, 'support': {'supports': 917, 'contradicts': 115, 'parts_of_same': 248}, 'micro_avg': {'precision': 0.7375, 'recall': 0.7375, 'f1': 0.7375, 'support': None}, 'macro_avg': {'precision': 0.6355738454503886, 'recall': 0.7621088952480877, 'f1': 0.6732605065977122, 'support': None}, 'weighted_avg': {'precision': 0.7967523118584741, 'recall': 0.7375, 'f1': 0.7516404744493362, 'support': None}}
Loss: tensor(0.0986, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1998, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1808, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3752, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0808, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3840, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3818, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0906, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1849, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0693, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0846, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1800, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0945, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7988, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8877, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0944, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0957, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0996, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0992, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0887, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1939, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0939, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0772, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5957, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0720, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8979, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5000, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0878, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5693, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1997, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0815, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0958, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0998, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4867, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5997, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2897, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2953, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6808, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0971, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0767, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3973, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1896, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2824, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0954, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0982, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0676, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5947, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2000, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2928, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0881, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5919, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1980, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4908, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0897, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0928, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0803, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0975, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3801, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0889, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0953, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0886, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0993, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0835, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7638, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9967, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3887, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0926, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0835, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0888, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0886, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5916, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0945, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0956, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7857, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0638, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3995, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0981, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1888, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1720, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2896, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2931, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0837, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0736, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8881, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2960, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2979, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2794, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2945, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0794, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0835, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1996, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3949, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3898, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0739, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0747, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0752, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6936, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2877, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2982, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0690, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0891, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1860, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1716, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5999, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0824, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6690, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3720, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0987, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1853, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1835, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6997, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0796, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2805, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4988, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0943, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3885, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1733, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0720, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3987, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2918, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3679, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0912, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0782, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0944, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1926, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1910, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0965, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1676, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0839, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0896, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0944, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7947, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3903, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3752, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0800, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2930, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1914, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0747, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0800, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0930, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0873, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0762, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1979, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0839, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1989, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0934, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7903, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5914, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9817, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0945, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1891, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0767, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2968, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0762, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6911, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0909, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0912, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0936, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0960, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0967, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1920, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0911, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5782, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0918, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0906, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5853, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0937, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6796, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5965, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0767, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1904, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2916, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2815, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2875, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2819, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8917, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4940, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4857, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3720, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1938, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0736, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0690, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6852, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0888, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0940, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0980, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6849, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0676, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3988, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2771, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6958, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2946, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0960, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0973, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0762, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0898, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0839, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1638, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1819, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0784, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1693, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2952, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2863, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0747, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2881, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0803, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1835, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0933, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0866, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5972, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0794, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0949, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0917, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3898, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 3---------------
Evaluating
				 {'precision': {'supports': 0.9608150470219435, 'contradicts': 0.48295454545454547, 'parts_of_same': 0.5021459227467812}, 'recall': {'supports': 0.6684841875681571, 'contradicts': 0.7391304347826086, 'parts_of_same': 0.9435483870967742}, 'f1': {'supports': 0.7884244372990353, 'contradicts': 0.584192439862543, 'parts_of_same': 0.6554621848739497}, 'support': {'supports': 917, 'contradicts': 115, 'parts_of_same': 248}, 'micro_avg': {'precision': 0.728125, 'recall': 0.728125, 'f1': 0.7281249999999999, 'support': None}, 'macro_avg': {'precision': 0.6486385050744233, 'recall': 0.78372100314918, 'f1': 0.6760263540118426, 'support': None}, 'weighted_avg': {'precision': 0.8290151247559349, 'recall': 0.728125, 'f1': 0.7443140323719901, 'support': None}}
Loss: tensor(0.5401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1940, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2951, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0986, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0852, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1820, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9956, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0991, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3879, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1935, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0925, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0993, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0679, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3979, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1801, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9758, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0991, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7989, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1000, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2789, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0911, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0777, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4979, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0693, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6962, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1870, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0946, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1954, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0883, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1000, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0737, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0903, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4000, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3815, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6676, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2989, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0817, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2959, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0998, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0956, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0819, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5693, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0909, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1987, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1969, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0860, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0960, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1919, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0889, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2777, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4000, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3928, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0772, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0958, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0817, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3690, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2987, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0939, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0784, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0676, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0975, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0989, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5938, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1716, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1846, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4960, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6849, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0955, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0892, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1870, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1637, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1921, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0888, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0927, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0873, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0942, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1863, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8900, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1886, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2777, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2994, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0806, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3946, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4742, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1000, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3969, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0690, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0942, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7840, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0943, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0787, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0833, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3945, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0927, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2909, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2985, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0951, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0913, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0637, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0801, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6927, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3962, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0720, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3944, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1958, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1975, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0947, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0918, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0767, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0777, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0949, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2857, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0998, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0921, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3318, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 4---------------
Evaluating
				 {'precision': {'supports': 0.9141242937853107, 'contradicts': 0.5538461538461539, 'parts_of_same': 0.7622641509433963}, 'recall': {'supports': 0.8822246455834242, 'contradicts': 0.6260869565217392, 'parts_of_same': 0.8145161290322581}, 'f1': {'supports': 0.8978912319644838, 'contradicts': 0.5877551020408163, 'parts_of_same': 0.7875243664717348}, 'support': {'supports': 917, 'contradicts': 115, 'parts_of_same': 248}, 'micro_avg': {'precision': 0.84609375, 'recall': 0.84609375, 'f1': 0.84609375, 'support': None}, 'macro_avg': {'precision': 0.743411532858287, 'recall': 0.7742759103791405, 'f1': 0.7577235668256783, 'support': None}, 'weighted_avg': {'precision': 0.8523326519745312, 'recall': 0.84609375, 'f1': 0.8486438588524342, 'support': None}}
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0837, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1943, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0819, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1927, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0888, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0949, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0915, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2963, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2575, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0676, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1676, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0879, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4857, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3991, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3985, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1900, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0994, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0820, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0867, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2989, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0996, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0720, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0638, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2924, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1777, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0863, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0934, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9982, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0857, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2834, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4877, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3944, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0834, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0690, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2955, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0888, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1881, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4956, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0951, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0904, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0687, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1805, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0892, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2885, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7995, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2945, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2959, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0975, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0881, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2889, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2846, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1764, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5923, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8889, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0909, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0923, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0918, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0981, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0693, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1938, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0849, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0888, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0772, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0806, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8891, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3693, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0679, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1808, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0720, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0853, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1910, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1860, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0751, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0793, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0772, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 5---------------
Evaluating
				 {'precision': {'supports': 0.9265605875152999, 'contradicts': 0.4913294797687861, 'parts_of_same': 0.7103448275862069}, 'recall': {'supports': 0.8255179934569248, 'contradicts': 0.7391304347826086, 'parts_of_same': 0.8306451612903226}, 'f1': {'supports': 0.8731257208765859, 'contradicts': 0.5902777777777777, 'parts_of_same': 0.7657992565055762}, 'support': {'supports': 917, 'contradicts': 115, 'parts_of_same': 248}, 'micro_avg': {'precision': 0.81875, 'recall': 0.81875, 'f1': 0.81875, 'support': None}, 'macro_avg': {'precision': 0.709411631623431, 'recall': 0.7984311965099521, 'f1': 0.7430675850533133, 'support': None}, 'weighted_avg': {'precision': 0.8455659891924373, 'recall': 0.81875, 'f1': 0.8269190985169192, 'support': None}}
Loss: tensor(9.7588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0921, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1948, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7820, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3818, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0982, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1877, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1997, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0967, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6762, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3969, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0921, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3918, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0820, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0690, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3890, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3965, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0889, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7992, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0975, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0857, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0955, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0771, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0862, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4887, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2863, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1767, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3910, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3796, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1000, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3923, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2945, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0952, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9998, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0834, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0839, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2912, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7889, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1676, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1737, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0741, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0742, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0857, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2637, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0956, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0998, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0996, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2870, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0890, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 6---------------
Evaluating
				 {'precision': {'supports': 0.909297052154195, 'contradicts': 0.6739130434782609, 'parts_of_same': 0.673202614379085}, 'recall': {'supports': 0.8745910577971646, 'contradicts': 0.5391304347826087, 'parts_of_same': 0.8306451612903226}, 'f1': {'supports': 0.8916064480266813, 'contradicts': 0.5990338164251208, 'parts_of_same': 0.743682310469314}, 'support': {'supports': 917, 'contradicts': 115, 'parts_of_same': 248}, 'micro_avg': {'precision': 0.8359375, 'recall': 0.8359375, 'f1': 0.8359375, 'support': None}, 'macro_avg': {'precision': 0.7521375700038471, 'recall': 0.7481222179566985, 'f1': 0.7447741916403721, 'support': None}, 'weighted_avg': {'precision': 0.8424059728057889, 'recall': 0.8359375, 'f1': 0.8366603240044886, 'support': None}}
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0833, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0808, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0736, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0860, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4806, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1990, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0885, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0789, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0927, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1638, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2990, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0803, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0960, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1879, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0945, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9991, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4930, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0881, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4870, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0954, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0837, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1909, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0817, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0787, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0877, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7961, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1917, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9979, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0762, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0874, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0956, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0716, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1720, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0982, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1912, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2820, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 7---------------
Evaluating
				 {'precision': {'supports': 0.9224629418472063, 'contradicts': 0.5985915492957746, 'parts_of_same': 0.7432950191570882}, 'recall': {'supports': 0.8822246455834242, 'contradicts': 0.7391304347826086, 'parts_of_same': 0.782258064516129}, 'f1': {'supports': 0.9018952062430322, 'contradicts': 0.6614785992217898, 'parts_of_same': 0.762278978388998}, 'support': {'supports': 917, 'contradicts': 115, 'parts_of_same': 248}, 'micro_avg': {'precision': 0.85, 'recall': 0.85, 'f1': 0.85, 'support': None}, 'macro_avg': {'precision': 0.754783170100023, 'recall': 0.8012043816273873, 'f1': 0.7752175946179399, 'support': None}, 'weighted_avg': {'precision': 0.8586513364014532, 'recall': 0.85, 'f1': 0.8532446325592483, 'support': None}}
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0638, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0883, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0958, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0930, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3848, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1885, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0886, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0679, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0912, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1958, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7834, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1879, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1999, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0973, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0879, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 8---------------
Evaluating
				 {'precision': {'supports': 0.8908523908523909, 'contradicts': 0.7386363636363636, 'parts_of_same': 0.7956521739130434}, 'recall': {'supports': 0.9345692475463467, 'contradicts': 0.5652173913043478, 'parts_of_same': 0.7379032258064516}, 'f1': {'supports': 0.912187333688132, 'contradicts': 0.6403940886699507, 'parts_of_same': 0.7656903765690376}, 'support': {'supports': 917, 'contradicts': 115, 'parts_of_same': 248}, 'micro_avg': {'precision': 0.86328125, 'recall': 0.86328125, 'f1': 0.86328125, 'support': None}, 'macro_avg': {'precision': 0.808380309467266, 'recall': 0.745896621552382, 'f1': 0.7727572663090401, 'support': None}, 'weighted_avg': {'precision': 0.8587316901252023, 'recall': 0.86328125, 'f1': 0.8593846238892052, 'support': None}}
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0736, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1800, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3676, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7839, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5919, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0784, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6997, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1767, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0772, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0767, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0915, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2946, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0991, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0758, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1833, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0805, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0720, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2767, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2875, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0933, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0819, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7955, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0953, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3862, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1782, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0976, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5840, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1938, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0900, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0837, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0904, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0885, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1945, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1904, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0994, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5935, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0947, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1687, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0883, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0849, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1921, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0928, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1934, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2870, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1762, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0993, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0891, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0638, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6030e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 9---------------
Evaluating
				 {'precision': {'supports': 0.9228110599078341, 'contradicts': 0.5801526717557252, 'parts_of_same': 0.7473309608540926}, 'recall': {'supports': 0.8735005452562704, 'contradicts': 0.6608695652173913, 'parts_of_same': 0.8467741935483871}, 'f1': {'supports': 0.8974789915966387, 'contradicts': 0.6178861788617886, 'parts_of_same': 0.7939508506616259}, 'support': {'supports': 917, 'contradicts': 115, 'parts_of_same': 248}, 'micro_avg': {'precision': 0.84921875, 'recall': 0.84921875, 'f1': 0.84921875, 'support': None}, 'macro_avg': {'precision': 0.7500982308392173, 'recall': 0.7937147680073496, 'f1': 0.7697720070400177, 'support': None}, 'weighted_avg': {'precision': 0.8580260761556306, 'recall': 0.84921875, 'f1': 0.8523007475213331, 'support': None}}
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0921, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0736, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1979, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0679, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1741, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0928, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0995, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0916, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0824, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5886, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1840, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0867, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1819, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0913, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0928, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9679, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1985, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2733, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0637, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0967, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0862, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0741, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1887, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2840, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 10---------------
Evaluating
				 {'precision': {'supports': 0.921968787515006, 'contradicts': 0.631578947368421, 'parts_of_same': 0.6306306306306306}, 'recall': {'supports': 0.8375136314067612, 'contradicts': 0.6260869565217392, 'parts_of_same': 0.8467741935483871}, 'f1': {'supports': 0.8777142857142857, 'contradicts': 0.6288209606986899, 'parts_of_same': 0.7228915662650602}, 'support': {'supports': 917, 'contradicts': 115, 'parts_of_same': 248}, 'micro_avg': {'precision': 0.8203125, 'recall': 0.8203125, 'f1': 0.8203125, 'support': None}, 'macro_avg': {'precision': 0.7280594551713525, 'recall': 0.7701249271589625, 'f1': 0.7431422708926786, 'support': None}, 'weighted_avg': {'precision': 0.8394323074179886, 'recall': 0.8203125, 'f1': 0.8253558741516283, 'support': None}}
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0789, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1000, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1939, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0908, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0900, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2973, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2889, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3660, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2889, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0886, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4824, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1693, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0758, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0752, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0888, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2999, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 11---------------
Evaluating
				 {'precision': {'supports': 0.9307511737089202, 'contradicts': 0.54, 'parts_of_same': 0.7410071942446043}, 'recall': {'supports': 0.8647764449291166, 'contradicts': 0.7043478260869566, 'parts_of_same': 0.8306451612903226}, 'f1': {'supports': 0.8965517241379309, 'contradicts': 0.6113207547169812, 'parts_of_same': 0.7832699619771863}, 'support': {'supports': 917, 'contradicts': 115, 'parts_of_same': 248}, 'micro_avg': {'precision': 0.84375, 'recall': 0.84375, 'f1': 0.84375, 'support': None}, 'macro_avg': {'precision': 0.7372527893178416, 'recall': 0.7999231441021318, 'f1': 0.7637141469440328, 'support': None}, 'weighted_avg': {'precision': 0.8588817269247982, 'recall': 0.84375, 'f1': 0.8489771628103732, 'support': None}}
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3963, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1916, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5693, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0837, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0801, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0846, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3910, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0939, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4808, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0940, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0806, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0928, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0742, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0888, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2989, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0985, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2839, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0782, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1973, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1819, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0787, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0881, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0908, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0833, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0833, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0837, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0796, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 12---------------
Evaluating
				 {'precision': {'supports': 0.9181494661921709, 'contradicts': 0.40869565217391307, 'parts_of_same': 0.8357487922705314}, 'recall': {'supports': 0.8440567066521265, 'contradicts': 0.8173913043478261, 'parts_of_same': 0.6975806451612904}, 'f1': {'supports': 0.8795454545454545, 'contradicts': 0.5449275362318841, 'parts_of_same': 0.7604395604395604}, 'support': {'supports': 917, 'contradicts': 115, 'parts_of_same': 248}, 'micro_avg': {'precision': 0.81328125, 'recall': 0.81328125, 'f1': 0.81328125, 'support': None}, 'macro_avg': {'precision': 0.7208646368788717, 'recall': 0.786342885387081, 'f1': 0.7283041837389663, 'support': None}, 'weighted_avg': {'precision': 0.8564130945166504, 'recall': 0.81328125, 'f1': 0.8264053589639527, 'support': None}}
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0952, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1000, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2885, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0803, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1939, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0866, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0824, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0985, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6980, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2948, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2914, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0904, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0862, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4886, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1891, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2946, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0796, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0937, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0660, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1972, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4342e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 13---------------
Evaluating
				 {'precision': {'supports': 0.9159192825112108, 'contradicts': 0.5460992907801419, 'parts_of_same': 0.7894736842105263}, 'recall': {'supports': 0.8909487459105779, 'contradicts': 0.6695652173913044, 'parts_of_same': 0.7862903225806451}, 'f1': {'supports': 0.9032614704256495, 'contradicts': 0.6015625000000001, 'parts_of_same': 0.7878787878787878}, 'support': {'supports': 917, 'contradicts': 115, 'parts_of_same': 248}, 'micro_avg': {'precision': 0.85078125, 'recall': 0.85078125, 'f1': 0.85078125, 'support': None}, 'macro_avg': {'precision': 0.7504974191672931, 'recall': 0.7822680952941758, 'f1': 0.7642342527681457, 'support': None}, 'weighted_avg': {'precision': 0.858194432958365, 'recall': 0.85078125, 'f1': 0.8538003088080156, 'support': None}}
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0908, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0638, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1862, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0892, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1777, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1999, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1926, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7815, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0676, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0953, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3946, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0863, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0782, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0891, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 14---------------
Evaluating
				 {'precision': {'supports': 0.9237770193401593, 'contradicts': 0.6206896551724138, 'parts_of_same': 0.7228070175438597}, 'recall': {'supports': 0.8854961832061069, 'contradicts': 0.6260869565217392, 'parts_of_same': 0.8306451612903226}, 'f1': {'supports': 0.9042316258351895, 'contradicts': 0.6233766233766235, 'parts_of_same': 0.7729831144465291}, 'support': {'supports': 917, 'contradicts': 115, 'parts_of_same': 248}, 'micro_avg': {'precision': 0.8515625, 'recall': 0.8515625, 'f1': 0.8515625, 'support': None}, 'macro_avg': {'precision': 0.7557578973521443, 'recall': 0.7807427670060562, 'f1': 0.766863787886114, 'support': None}, 'weighted_avg': {'precision': 0.8576085761176803, 'recall': 0.8515625, 'f1': 0.8535691601264999, 'support': None}}
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0898, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0767, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0920, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1808, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0372e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9328e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4129e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8111e-06, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 15---------------
Evaluating
				 {'precision': {'supports': 0.9044038668098818, 'contradicts': 0.6666666666666666, 'parts_of_same': 0.7854251012145749}, 'recall': {'supports': 0.9182115594329335, 'contradicts': 0.591304347826087, 'parts_of_same': 0.782258064516129}, 'f1': {'supports': 0.9112554112554113, 'contradicts': 0.6267281105990784, 'parts_of_same': 0.7838383838383838}, 'support': {'supports': 917, 'contradicts': 115, 'parts_of_same': 248}, 'micro_avg': {'precision': 0.8625, 'recall': 0.8625, 'f1': 0.8625, 'support': None}, 'macro_avg': {'precision': 0.7854985448970412, 'recall': 0.7639246572583831, 'f1': 0.7739406352309578, 'support': None}, 'weighted_avg': {'precision': 0.859992529400424, 'recall': 0.8625, 'f1': 0.8610053625250197, 'support': None}}
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8425e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4491e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3962, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0372e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8154e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8653e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4129e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3586e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3767e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3169e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 16---------------
Evaluating
				 {'precision': {'supports': 0.9140969162995595, 'contradicts': 0.6363636363636364, 'parts_of_same': 0.7709923664122137}, 'recall': {'supports': 0.9051254089422028, 'contradicts': 0.6086956521739131, 'parts_of_same': 0.8145161290322581}, 'f1': {'supports': 0.9095890410958903, 'contradicts': 0.6222222222222223, 'parts_of_same': 0.792156862745098}, 'support': {'supports': 917, 'contradicts': 115, 'parts_of_same': 248}, 'micro_avg': {'precision': 0.8609375, 'recall': 0.8609375, 'f1': 0.8609375, 'support': None}, 'macro_avg': {'precision': 0.7738176396918032, 'recall': 0.7761123967161246, 'f1': 0.7746560420210703, 'support': None}, 'weighted_avg': {'precision': 0.8614178103896432, 'recall': 0.8609375, 'f1': 0.8610184439072432, 'support': None}}
Loss: tensor(9.3224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0372e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4491e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4491e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0372e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3586e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4310e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0988e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4310e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4666e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0372e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0916e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 17---------------
Evaluating
				 {'precision': {'supports': 0.9131868131868132, 'contradicts': 0.6422018348623854, 'parts_of_same': 0.7739463601532567}, 'recall': {'supports': 0.906215921483097, 'contradicts': 0.6086956521739131, 'parts_of_same': 0.8145161290322581}, 'f1': {'supports': 0.9096880131362889, 'contradicts': 0.625, 'parts_of_same': 0.7937131630648331}, 'support': {'supports': 917, 'contradicts': 115, 'parts_of_same': 248}, 'micro_avg': {'precision': 0.86171875, 'recall': 0.86171875, 'f1': 0.86171875, 'support': None}, 'macro_avg': {'precision': 0.7764450027341517, 'recall': 0.7764759008964227, 'f1': 0.7761337254003741, 'support': None}, 'weighted_avg': {'precision': 0.8618626687652263, 'recall': 0.86171875, 'f1': 0.8616404472547309, 'support': None}}
Loss: tensor(2.5486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8397e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3737e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5776e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0851e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0459e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7024e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2856e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9260e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4754e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5602e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4167e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7205e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9088e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4353e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2794e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1516e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1320e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2719e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9920e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0704e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7346e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6589e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4534e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8258e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8425e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4896e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9591e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7699e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7024e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2832e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7571e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7450e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7461e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0722e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 18---------------
Evaluating
				 {'precision': {'supports': 0.9132821075740944, 'contradicts': 0.6422018348623854, 'parts_of_same': 0.7769230769230769}, 'recall': {'supports': 0.9073064340239912, 'contradicts': 0.6086956521739131, 'parts_of_same': 0.8145161290322581}, 'f1': {'supports': 0.9102844638949672, 'contradicts': 0.625, 'parts_of_same': 0.7952755905511811}, 'support': {'supports': 917, 'contradicts': 115, 'parts_of_same': 248}, 'micro_avg': {'precision': 0.8625, 'recall': 0.8625, 'f1': 0.8625, 'support': None}, 'macro_avg': {'precision': 0.7774690064531855, 'recall': 0.7768394050767208, 'f1': 0.7768533514820494, 'support': None}, 'weighted_avg': {'precision': 0.8625076771340172, 'recall': 0.8625, 'f1': 0.8623704686315452, 'support': None}}
Loss: tensor(2.4964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5737e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4310e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1205e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3803e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6189e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1176e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6816e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8339e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9112e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6882e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2379e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8600e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5068e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8569e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9419e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8244e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6478e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8772e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4896e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6525e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2207e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1320e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4520e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6414e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8264e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6361e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2414e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4129e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9322e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3421e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6525e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3898e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4715e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0794e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6123e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5589e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8767e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6271e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9712e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8882e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2044e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5253e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3465e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4039e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6478e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7205e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7024e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2317e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8244e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5328e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9876e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9483e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2313e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8792e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8216e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9708e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1384e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0997e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9849e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2251e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4527e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0055e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3171e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7024e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8704e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8878e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2648e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6419e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7668e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5258e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6167e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 19---------------
Evaluating
				 {'precision': {'supports': 0.9132821075740944, 'contradicts': 0.6422018348623854, 'parts_of_same': 0.7769230769230769}, 'recall': {'supports': 0.9073064340239912, 'contradicts': 0.6086956521739131, 'parts_of_same': 0.8145161290322581}, 'f1': {'supports': 0.9102844638949672, 'contradicts': 0.625, 'parts_of_same': 0.7952755905511811}, 'support': {'supports': 917, 'contradicts': 115, 'parts_of_same': 248}, 'micro_avg': {'precision': 0.8625, 'recall': 0.8625, 'f1': 0.8625, 'support': None}, 'macro_avg': {'precision': 0.7774690064531855, 'recall': 0.7768394050767208, 'f1': 0.7768533514820494, 'support': None}, 'weighted_avg': {'precision': 0.8625076771340172, 'recall': 0.8625, 'f1': 0.8623704686315452, 'support': None}}
Loss: tensor(1.4950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1361e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7072e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9227e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4491e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0039e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5569e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2132e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1693e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6542e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5982e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5714e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9461e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3405e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2988e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5436e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6317e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0174e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5695e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0408e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0258e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2547e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8913e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6271e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3478e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0317e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9953e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6666e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7302e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3388e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4350e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9902e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8136e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1203e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8591e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9512e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9783e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9057e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1600e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5827e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8472e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7129e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4534e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6706e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9278e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0754e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3412e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9421e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2127e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5022e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4218e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2997e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6379e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4735e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9878e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8516e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7209e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4324e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8514e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9547e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6772e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9381e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6805e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2862e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0545e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8542e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6920e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7452e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3397e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2997e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2339e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7761e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1405e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8759e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3103e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5436e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0516e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1262e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4715e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6342e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3900e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4688e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3430e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4439e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6077e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1759e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9728e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5984e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7260e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3902e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5178e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0461e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2127e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4792e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3624e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5077e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8154e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6295e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3017e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8176e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0004e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9483e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4129e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1057e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2569e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3518e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9655e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8006e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2851e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6061e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6311e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 20---------------
Evaluating
				 {'precision': {'supports': 0.9132821075740944, 'contradicts': 0.6422018348623854, 'parts_of_same': 0.7769230769230769}, 'recall': {'supports': 0.9073064340239912, 'contradicts': 0.6086956521739131, 'parts_of_same': 0.8145161290322581}, 'f1': {'supports': 0.9102844638949672, 'contradicts': 0.625, 'parts_of_same': 0.7952755905511811}, 'support': {'supports': 917, 'contradicts': 115, 'parts_of_same': 248}, 'micro_avg': {'precision': 0.8625, 'recall': 0.8625, 'f1': 0.8625, 'support': None}, 'macro_avg': {'precision': 0.7774690064531855, 'recall': 0.7768394050767208, 'f1': 0.7768533514820494, 'support': None}, 'weighted_avg': {'precision': 0.8625076771340172, 'recall': 0.8625, 'f1': 0.8623704686315452, 'support': None}}
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9728e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2904e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5384e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5465e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2092e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6313e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3737e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7854e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9781e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5439e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9203e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0887e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4896e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1320e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9441e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0255e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5410e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6370e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7200e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5063e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7216e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8368e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7249e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5231e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0955e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5141e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9019e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5447e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6549e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8776e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9441e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6130e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4423e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7443e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6491e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9068e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7244e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1231e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8586e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9147e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6249e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6211e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2129e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7940e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9015e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6163e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7637e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8909e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9918e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2847e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6461e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7529e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7255e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4313e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6205e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9737e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2598e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7450e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3677e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2931e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4534e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6730e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9271e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1141e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5044e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6960e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4172e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7443e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1320e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8154e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3540e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5949e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2476e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6255e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2900e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4975e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1940e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7112e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5821e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1953e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0505e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4310e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4355e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3141e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5512e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9439e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2845e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5509e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1310e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1229e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3693e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9640e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1129e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3809e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5244e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3505e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4339e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3856e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2675e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4143e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1178e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6876e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1209e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5646e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6807e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5313e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0165e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5900e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5708e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4626e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0068e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6491e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4353e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2591e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5977e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0059e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0655e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0573e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4776e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0542e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2657e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5565e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6264e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3571e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7004e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0304e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7121e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0006e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7878e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7721e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6920e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8198e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9783e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4384e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2701e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0823e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7924e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7847e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0158e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0982e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8092e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6706e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7147e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0714e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8116e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6308e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0882e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6719e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3655e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6845e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2776e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7783e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5640e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8346e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8370e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0112e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7825e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2598e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8333e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9554e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9010e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9796e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4715e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4580e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9324e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1320e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7213e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7690e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3889e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 21---------------
Evaluating
				 {'precision': {'supports': 0.9132821075740944, 'contradicts': 0.6422018348623854, 'parts_of_same': 0.7769230769230769}, 'recall': {'supports': 0.9073064340239912, 'contradicts': 0.6086956521739131, 'parts_of_same': 0.8145161290322581}, 'f1': {'supports': 0.9102844638949672, 'contradicts': 0.625, 'parts_of_same': 0.7952755905511811}, 'support': {'supports': 917, 'contradicts': 115, 'parts_of_same': 248}, 'micro_avg': {'precision': 0.8625, 'recall': 0.8625, 'f1': 0.8625, 'support': None}, 'macro_avg': {'precision': 0.7774690064531855, 'recall': 0.7768394050767208, 'f1': 0.7768533514820494, 'support': None}, 'weighted_avg': {'precision': 0.8625076771340172, 'recall': 0.8625, 'f1': 0.8623704686315452, 'support': None}}
Loss: tensor(6.0339e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5851e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2476e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8470e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3447e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4578e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4132e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6982e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6392e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2982e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1368e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4878e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2554e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1478e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7505e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1677e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5203e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0311e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9593e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5640e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4997e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8346e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9147e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8719e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0496e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6436e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1092e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8628e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6701e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9668e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8648e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3251e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0498e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3792e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2346e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7633e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0876e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3580e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0847e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4439e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2591e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2178e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5898e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0809e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3862e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6832e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3319e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8767e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4236e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9225e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6982e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4417e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5242e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0598e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8346e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5176e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9434e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7459e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6284e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8951e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3728e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5191e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5225e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4339e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1004e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0573e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8278e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0690e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0417e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0686e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2220e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6101e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2324e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6445e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0099e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7924e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0127e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4434e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3319e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7496e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7984e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3017e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9721e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3615e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4657e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4635e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1865e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7101e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9419e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2600e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0860e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3922e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4370e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1057e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1443e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4467e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7319e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5666e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2885e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5244e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1677e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4216e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4465e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9185e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4904e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9304e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0445e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7518e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2695e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6465e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7388e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0637e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9781e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9668e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4807e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5765e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4180e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2048e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1684e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7805e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7593e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4540e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8909e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0311e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4015e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4357e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9554e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7491e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3172e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4026e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6706e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7406e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9768e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3138e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1079e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7366e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1410e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9238e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5485e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7348e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9580e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3973e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8602e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1366e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1203e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9593e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6723e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6805e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6706e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8310e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1297e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9037e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2189e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2509e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8664e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2233e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4178e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7781e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8708e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0686e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3589e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7898e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6430e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4902e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4904e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9942e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1216e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8889e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3889e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7028e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0264e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6498e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9251e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5900e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8059e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3889e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8105e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0064e-06, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 22---------------
Evaluating
				 {'precision': {'supports': 0.9132821075740944, 'contradicts': 0.6422018348623854, 'parts_of_same': 0.7769230769230769}, 'recall': {'supports': 0.9073064340239912, 'contradicts': 0.6086956521739131, 'parts_of_same': 0.8145161290322581}, 'f1': {'supports': 0.9102844638949672, 'contradicts': 0.625, 'parts_of_same': 0.7952755905511811}, 'support': {'supports': 917, 'contradicts': 115, 'parts_of_same': 248}, 'micro_avg': {'precision': 0.8625, 'recall': 0.8625, 'f1': 0.8625, 'support': None}, 'macro_avg': {'precision': 0.7774690064531855, 'recall': 0.7768394050767208, 'f1': 0.7768533514820494, 'support': None}, 'weighted_avg': {'precision': 0.8625076771340172, 'recall': 0.8625, 'f1': 0.8623704686315452, 'support': None}}
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8520e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9927e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8310e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5229e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5185e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1946e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4311e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3379e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5781e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4916e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9092e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4308e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5317e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2171e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4293e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8565e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9869e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8845e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0909e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7200e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2461e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6657e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8920e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6313e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7924e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4180e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5258e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3492e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8346e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0571e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2648e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8425e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4655e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0571e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2189e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4988e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1684e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0278e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4158e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5580e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5412e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4432e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2180e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1955e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0017e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4909e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7249e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5741e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6352e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9244e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3132e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2046e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1838e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7401e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8346e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3200e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2635e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5821e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6525e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0913e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3902e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7712e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7642e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5699e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9238e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4869e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1818e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8982e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2161e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0518e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9487e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4180e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7154e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7485e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0401e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3227e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7313e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1496e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5244e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3525e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5269e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0015e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8668e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0781e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8311e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3615e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3487e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5154e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5222e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8922e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2370e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7715e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4909e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4960e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5163e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0242e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9587e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9072e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5785e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6368e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7220e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0461e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2342e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3487e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4540e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2951e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0348e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5728e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8176e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1911e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4271e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0651e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6746e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2282e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1940e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3163e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6887e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5982e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5721e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1898e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6421e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8997e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8152e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5774e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9796e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5231e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6845e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8231e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5525e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2719e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8273e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9759e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8401e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1262e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8039e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6328e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7381e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7430e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2273e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2055e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3628e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9668e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3130e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9805e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4008e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9812e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6549e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9953e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8379e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3918e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7222e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8580e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3600e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7675e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0295e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2686e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2587e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4311e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1565e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1593e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3896e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6249e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6624e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2723e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0289e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0311e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2313e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2225e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1227e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5017e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2436e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1737e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3673e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6154e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7205e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1509e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8368e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7134e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4940e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3006e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2569e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6792e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3743e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5242e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8785e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4909e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1593e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2454e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3366e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9030e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2315e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8310e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0624e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8957e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7699e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1688e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0485e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4205e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6801e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7244e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4251e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0436e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7895e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9626e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1229e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7134e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3055e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0695e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3909e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1236e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2436e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 23---------------
Evaluating
				 {'precision': {'supports': 0.9132821075740944, 'contradicts': 0.6422018348623854, 'parts_of_same': 0.7769230769230769}, 'recall': {'supports': 0.9073064340239912, 'contradicts': 0.6086956521739131, 'parts_of_same': 0.8145161290322581}, 'f1': {'supports': 0.9102844638949672, 'contradicts': 0.625, 'parts_of_same': 0.7952755905511811}, 'support': {'supports': 917, 'contradicts': 115, 'parts_of_same': 248}, 'micro_avg': {'precision': 0.8625, 'recall': 0.8625, 'f1': 0.8625, 'support': None}, 'macro_avg': {'precision': 0.7774690064531855, 'recall': 0.7768394050767208, 'f1': 0.7768533514820494, 'support': None}, 'weighted_avg': {'precision': 0.8625076771340172, 'recall': 0.8625, 'f1': 0.8623704686315452, 'support': None}}
Loss: tensor(7.0596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6006e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8024e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9350e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3405e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7633e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5077e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7562e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6476e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7249e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2167e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8997e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8368e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0101e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5105e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2055e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2368e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4353e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2598e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3896e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5244e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1434e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4178e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3816e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8384e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2167e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4995e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0176e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9028e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4646e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3816e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0969e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4856e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7862e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4688e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5869e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0589e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0982e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7213e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2257e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7205e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7308e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3997e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5697e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4028e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8997e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0774e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9172e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0858e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0141e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9145e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9213e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8876e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9103e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8573e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9015e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0856e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9284e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3209e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2112e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0966e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2127e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4507e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2295e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1951e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3138e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7851e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5529e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7827e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4452e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6728e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6858e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2282e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5264e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8189e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6946e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6635e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6920e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2483e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7200e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3796e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9406e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2269e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5317e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8105e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9920e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2289e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3637e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3500e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0379e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8591e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0982e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2860e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6556e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8205e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7761e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6147e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4896e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8220e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1805e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8348e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4339e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3849e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5105e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9746e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4633e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4832e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0158e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0322e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5640e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7004e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6068e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1050e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4573e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4353e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3821e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9388e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3381e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3339e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6467e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3487e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1154e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1375e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5772e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1578e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9331e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7651e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4801e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9847e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1973e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0730e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3849e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2348e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7127e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9565e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8392e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3931e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6255e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8863e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2077e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2167e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6735e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3715e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1913e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7765e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4666e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0308e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7039e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0701e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5220e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8604e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6022e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0529e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1141e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2498e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3955e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6571e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9207e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5169e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6492e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3092e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7461e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9827e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4869e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4721e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5704e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5478e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6723e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4891e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4505e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8342e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7763e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2141e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7503e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4832e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0039e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6304e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7675e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1746e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2657e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9125e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5227e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3896e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5050e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7172e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1328e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2476e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2858e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0966e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6099e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7406e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4900e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1348e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1927e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2823e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6845e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4715e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7924e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6366e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0189e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5163e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1443e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3714e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1730e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4043e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5887e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9030e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1397e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2017e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3918e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9022e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8895e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9512e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4507e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2785e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2019e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6498e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3092e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0311e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1637e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9297e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6838e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8854e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8772e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9728e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7489e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4203e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8701e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7092e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1194e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1203e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4114e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9304e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5772e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0032e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2121e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1746e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3770e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1167e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2595e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4792e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4030e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0990e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5478e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5055e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2233e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6403e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6032e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0920e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7774e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2434e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3229e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2132e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4030e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6328e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8286e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2331e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1412e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3816e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6430e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4851e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4505e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1918e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0050e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5779e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9690e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0785e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3889e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7805e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9216e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9178e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8039e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 24---------------
Evaluating
				 {'precision': {'supports': 0.9132821075740944, 'contradicts': 0.6422018348623854, 'parts_of_same': 0.7769230769230769}, 'recall': {'supports': 0.9073064340239912, 'contradicts': 0.6086956521739131, 'parts_of_same': 0.8145161290322581}, 'f1': {'supports': 0.9102844638949672, 'contradicts': 0.625, 'parts_of_same': 0.7952755905511811}, 'support': {'supports': 917, 'contradicts': 115, 'parts_of_same': 248}, 'micro_avg': {'precision': 0.8625, 'recall': 0.8625, 'f1': 0.8625, 'support': None}, 'macro_avg': {'precision': 0.7774690064531855, 'recall': 0.7768394050767208, 'f1': 0.7768533514820494, 'support': None}, 'weighted_avg': {'precision': 0.8625076771340172, 'recall': 0.8625, 'f1': 0.8623704686315452, 'support': None}}
Loss: tensor(2.0988e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0688e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2465e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8024e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7271e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7675e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7582e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5832e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5392e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8538e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2889e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3079e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0352e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0061e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8491e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5507e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7640e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7178e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5266e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9465e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6536e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8498e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7200e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8088e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6772e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4754e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9478e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4712e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8520e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7172e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2999e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7220e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6114e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4436e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2589e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2295e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9893e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7403e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1055e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8765e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3600e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7236e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1189e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7525e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0637e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5176e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3085e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6565e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7487e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0838e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0032e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0854e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7470e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1476e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1203e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2869e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0015e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9191e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1125e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2628e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0582e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3505e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8308e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7041e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9759e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9408e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3013e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6216e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0677e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5953e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4224e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2776e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4935e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7224e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1101e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6895e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4540e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0673e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5869e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5470e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9531e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1370e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2044e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2368e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7489e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1397e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3527e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4203e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7132e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4851e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9525e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8927e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6518e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3918e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5772e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7489e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0646e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9207e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5684e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8487e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1101e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8489e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6105e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4505e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2768e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1147e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3505e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0293e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3026e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0289e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6315e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8602e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0004e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6525e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0311e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5366e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0767e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4520e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3916e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4156e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2399e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0684e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5116e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0832e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3130e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8205e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4754e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5752e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1436e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0436e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7763e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8863e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2030e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0121e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6227e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3995e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8533e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4136e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7858e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2461e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0445e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5785e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9211e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5129e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0289e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7213e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8653e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5061e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3908e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6408e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0112e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0785e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6677e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6147e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9540e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5719e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4823e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1253e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2253e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1668e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4030e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9653e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2949e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8693e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4180e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3070e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9297e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7677e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4224e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6105e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5399e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2052e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7763e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2911e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0470e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3266e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7675e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4244e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9470e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4518e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4726e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4156e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8454e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9540e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1624e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4505e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5516e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8951e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4518e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7900e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4315e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6860e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2238e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9421e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8194e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1333e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7670e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6858e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6944e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2275e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0655e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9257e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4913e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5772e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5946e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6476e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7534e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0955e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0752e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5478e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8863e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8518e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9015e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7059e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3487e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8849e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1529e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9244e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1803e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3070e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9257e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8558e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7190e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2317e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5229e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7443e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4721e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1397e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6006e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4565e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5072e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2403e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1827e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7858e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0558e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0302e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0039e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3728e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0529e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7582e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7867e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5410e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3849e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6430e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2414e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3004e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4746e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0865e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8154e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4529e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5966e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8922e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4637e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6401e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5990e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7066e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9655e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7529e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8352e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7763e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4405e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4043e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9556e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1871e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1825e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7556e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6785e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5108e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3600e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0288e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3487e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1017e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3533e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3908e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4818e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9653e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0670e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8251e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1022e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0121e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8454e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9072e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9271e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8503e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4180e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1333e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4880e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3070e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1176e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8604e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3125e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9015e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1050e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2876e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8213e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8129e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7697e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4317e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1922e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4505e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9381e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3171e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4505e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2602e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5350e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2370e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3138e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9390e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3138e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2293e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3668e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1244e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9615e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3962e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2651e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1328e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7944e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4143e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0293e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5242e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4982e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7990e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6509e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6032e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8024e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3878e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5129e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4143e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2902e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5580e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2615e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8129e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1452e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9977e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7099e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1198e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0094e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4746e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8997e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7043e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2346e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8478e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4900e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 25---------------
Evaluating
				 {'precision': {'supports': 0.9132821075740944, 'contradicts': 0.6422018348623854, 'parts_of_same': 0.7769230769230769}, 'recall': {'supports': 0.9073064340239912, 'contradicts': 0.6086956521739131, 'parts_of_same': 0.8145161290322581}, 'f1': {'supports': 0.9102844638949672, 'contradicts': 0.625, 'parts_of_same': 0.7952755905511811}, 'support': {'supports': 917, 'contradicts': 115, 'parts_of_same': 248}, 'micro_avg': {'precision': 0.8625, 'recall': 0.8625, 'f1': 0.8625, 'support': None}, 'macro_avg': {'precision': 0.7774690064531855, 'recall': 0.7768394050767208, 'f1': 0.7768533514820494, 'support': None}, 'weighted_avg': {'precision': 0.8625076771340172, 'recall': 0.8625, 'f1': 0.8623704686315452, 'support': None}}
Loss: tensor(2.3228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0121e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5975e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2410e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1275e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3882e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4573e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3896e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5483e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0112e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2942e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8037e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7478e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1147e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6589e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5704e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4858e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2520e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6315e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5591e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2538e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9013e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3432e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9796e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9587e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1503e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5242e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3353e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6441e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0275e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9147e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2902e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3794e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8673e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0805e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1094e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2465e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2631e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0074e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7353e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0551e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7529e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1865e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4445e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2052e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0094e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1324e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1370e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3167e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5342e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7598e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7425e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1997e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9540e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4445e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1443e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6057e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2827e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1999e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0094e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4754e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7039e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2772e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0807e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6750e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5410e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4211e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1651e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1147e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1384e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3781e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5257e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5380e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4565e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1891e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0805e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3116e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9324e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7969e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5154e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4982e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3534e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8311e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9827e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3962e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8257e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3600e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0571e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4969e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4077e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1198e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0492e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1375e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2635e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6022e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4640e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2957e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7156e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0818e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8770e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1723e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3549e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7072e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2615e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5953e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9339e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4247e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0966e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2052e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0966e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8487e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1942e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8817e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4573e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3478e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2392e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2348e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5966e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8533e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5231e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7154e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5693e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8951e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2772e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6145e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1408e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7006e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1955e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5302e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9000e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4244e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4461e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3048e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8046e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4403e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4573e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8302e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3130e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3361e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2529e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0233e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3794e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7381e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6315e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2253e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9678e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0818e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1275e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2863e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5878e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8622e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0761e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2695e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7867e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1189e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0108e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9447e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1690e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0821e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9675e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5260e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0962e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3487e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5342e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2708e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4882e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5478e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5141e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8171e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2410e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8399e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8860e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5213e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2549e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0121e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6295e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0827e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3339e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6163e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6754e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3505e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3047e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4063e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2763e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1022e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6706e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3690e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5238e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7628e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8951e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5189e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7529e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4156e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5196e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4935e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1690e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6770e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1328e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7006e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2973e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2953e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8533e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9257e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7628e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5796e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1953e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9721e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0242e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4578e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4165e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8171e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2072e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1677e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9035e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5505e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3823e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4205e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0514e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1019e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0443e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3849e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4143e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3171e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7108e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8849e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6315e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9392e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5154e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5684e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4244e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2935e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6484e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3125e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5489e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2406e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9022e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3896e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0637e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8516e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3116e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3487e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7381e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6134e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8487e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0293e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7447e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6677e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2132e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2876e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1704e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2763e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9392e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5470e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0858e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8026e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7675e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1454e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8714e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9918e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2099e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4039e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8476e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3459e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2072e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3677e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2233e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7955e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1913e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4063e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5196e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5478e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5785e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4880e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0646e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5955e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4392e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5704e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7701e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1505e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5668e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0628e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1324e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3370e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1099e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2902e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7070e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5399e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6858e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0443e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6514e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6946e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5693e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3412e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6447e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4858e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5432e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3876e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3668e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0443e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4030e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0785e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9678e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0061e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7134e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1099e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7990e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3238e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7723e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9902e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7433e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2434e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7006e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6681e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1576e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5116e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8454e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5794e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2573e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2982e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9427e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5512e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2935e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4059e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2591e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0284e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2057e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4151e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3030e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0112e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4143e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3882e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2595e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0965e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5684e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6147e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7063e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2507e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4674e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8024e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2708e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2957e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6194e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6375e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2048e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5704e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1167e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8817e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9678e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2220e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5719e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2317e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9370e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1324e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3017e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1167e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3946e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1891e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2944e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9320e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8783e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5904e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1891e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8646e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6668e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3735e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7322e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3134e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1101e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4586e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7224e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3997e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3379e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5065e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 26---------------
Evaluating
				 {'precision': {'supports': 0.9112814895947426, 'contradicts': 0.6388888888888888, 'parts_of_same': 0.7760617760617761}, 'recall': {'supports': 0.9073064340239912, 'contradicts': 0.6, 'parts_of_same': 0.8104838709677419}, 'f1': {'supports': 0.9092896174863389, 'contradicts': 0.6188340807174887, 'parts_of_same': 0.7928994082840236}, 'support': {'supports': 917, 'contradicts': 115, 'parts_of_same': 248}, 'micro_avg': {'precision': 0.8609375, 'recall': 0.8609375, 'f1': 0.8609375, 'support': None}, 'macro_avg': {'precision': 0.7754107181818025, 'recall': 0.7725967683305778, 'f1': 0.7736743688292838, 'support': None}, 'weighted_avg': {'precision': 0.8606098973780638, 'recall': 0.8609375, 'f1': 0.8606433998218138, 'support': None}}
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8127e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1328e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5432e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0288e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1333e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5693e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5719e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4485e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9969e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7684e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7752e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0262e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9169e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7909e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5432e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0626e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6960e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6498e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9434e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4982e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5591e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4224e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7405e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0624e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4333e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2414e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8714e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3487e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0443e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0651e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5765e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2664e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1198e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6668e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0726e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8701e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3520e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1891e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1914e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2297e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9927e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1174e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4231e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6417e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3812e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1509e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1180e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1914e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5516e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7867e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5535e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9339e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1914e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3668e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9384e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2324e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8904e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5310e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9913e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1342e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8512e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0728e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5891e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5961e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9922e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6484e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2437e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3419e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8767e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7099e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9000e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8854e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0637e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0249e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4278e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8302e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0015e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8320e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3681e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9582e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8807e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5278e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1231e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3041e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1352e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2600e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5079e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7233e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2437e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1914e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5070e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4174e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9678e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5823e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5953e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3916e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5061e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9055e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6165e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1161e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8951e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3908e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3419e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5070e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2238e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9257e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3697e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4545e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5297e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8646e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1803e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1690e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1529e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7190e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0288e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8006e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9766e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4505e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5410e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3908e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6163e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7085e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4518e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5432e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5535e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5342e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9893e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9465e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2098e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9766e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0807e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2229e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4573e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9902e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6156e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4554e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1871e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4247e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0693e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7862e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2796e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7529e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5604e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4518e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1927e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6145e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0192e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6858e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3478e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3975e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7529e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5061e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4194e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5380e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7447e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0818e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5752e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2333e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4935e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2801e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2591e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6904e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3143e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0264e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3492e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2341e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8880e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5405e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4534e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6315e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0640e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4703e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9571e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8304e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6328e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3079e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8352e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3701e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3386e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7631e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2809e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1147e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4247e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6838e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5229e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5704e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5410e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9558e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1704e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9339e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0262e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6690e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4754e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0693e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0192e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2953e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0785e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6145e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8491e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8817e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6138e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1328e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9924e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3057e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3388e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2039e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8693e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4708e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8294e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6668e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1576e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9339e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7867e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3962e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7145e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0423e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7414e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5207e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1885e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3668e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9754e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1143e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2536e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7600e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3412e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0262e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2695e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4063e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4902e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1342e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8942e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4024e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5885e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2072e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1324e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4063e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9046e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9940e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2233e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0262e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7578e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9766e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8478e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4823e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1237e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3419e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8294e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4858e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6392e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5975e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2615e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5161e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7772e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8178e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9061e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3386e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4801e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1927e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1931e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5154e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8681e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2863e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8171e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2889e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6542e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1161e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7061e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0761e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2098e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4335e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0646e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6852e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7224e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1997e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9121e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5545e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9008e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7628e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8754e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1017e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5677e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9339e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0627e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8761e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6207e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1053e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0624e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2070e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5885e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8966e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0545e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3238e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9853e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1282e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5580e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3908e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4247e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5503e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6904e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2052e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5100e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0218e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1324e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0035e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6910e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7911e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6145e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4238e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8817e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8533e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7478e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5161e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6328e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6668e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9339e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6491e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0942e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9670e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2346e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1914e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7190e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7224e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9189e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3812e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0355e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6657e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8331e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6066e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9339e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2953e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8024e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1635e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1670e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0074e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3781e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6396e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1010e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4772e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5380e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7955e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6484e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2957e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3384e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5604e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1237e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2944e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1461e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5125e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3545e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8206e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9766e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2863e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4247e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8294e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4057e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6147e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5704e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7944e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0443e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5209e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7529e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0288e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7730e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7549e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1516e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5209e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9000e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4686e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2525e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4030e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4247e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0104e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2002e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1237e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3570e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2695e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7017e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5623e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9569e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6129e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2695e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6134e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2796e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3057e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8988e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8032e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3668e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3138e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5807e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9243e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4335e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9551e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6492e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4335e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1480e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9902e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0715e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6880e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3269e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0809e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7595e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5196e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0262e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6699e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7990e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1774e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5885e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7529e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7642e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4249e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1167e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2068e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7017e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0104e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9243e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3189e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4030e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2066e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6668e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5719e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2832e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6858e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6572e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3450e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3570e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5785e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3386e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2902e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9370e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3849e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4357e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1333e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4143e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3116e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3975e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1984e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 27---------------
Evaluating
				 {'precision': {'supports': 0.9113785557986871, 'contradicts': 0.6448598130841121, 'parts_of_same': 0.7760617760617761}, 'recall': {'supports': 0.9083969465648855, 'contradicts': 0.6, 'parts_of_same': 0.8104838709677419}, 'f1': {'supports': 0.9098853085745495, 'contradicts': 0.6216216216216217, 'parts_of_same': 0.7928994082840236}, 'support': {'supports': 917, 'contradicts': 115, 'parts_of_same': 248}, 'micro_avg': {'precision': 0.86171875, 'recall': 0.86171875, 'f1': 0.86171875, 'support': None}, 'macro_avg': {'precision': 0.7774333816481919, 'recall': 0.7729602725108758, 'f1': 0.7748021128267316, 'support': None}, 'weighted_avg': {'precision': 0.861215886433898, 'recall': 0.86171875, 'f1': 0.861320599768583, 'support': None}}
Loss: tensor(1.0628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8324e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0737e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5623e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0192e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2401e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3677e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3386e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4772e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7911e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6342e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6467e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4335e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8478e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3781e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3026e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8518e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5885e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6145e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3158e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9678e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3735e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4674e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9026e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9531e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8635e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7224e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4880e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7617e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5961e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9554e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6176e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1406e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2907e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0436e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4586e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4946e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0264e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1529e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2525e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0918e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2434e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7026e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9216e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6670e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3908e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3631e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6361e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7024e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5380e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2165e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9670e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8382e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2514e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0918e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5196e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7085e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5310e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0264e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9372e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4174e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7628e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4174e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6763e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6145e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6129e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2333e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8178e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3386e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5684e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3290e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6484e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7433e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1328e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1487e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7730e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3570e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8512e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4324e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6668e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1088e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0907e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4335e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2459e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0288e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3238e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6046e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7433e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6396e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4474e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6910e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1010e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7867e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5100e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6484e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3821e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7024e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8556e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5719e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2485e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3315e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5535e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5284e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8382e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4180e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0624e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6572e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8509e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5161e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1053e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8721e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5061e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2253e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5704e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5885e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7224e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4030e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0262e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0008e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6384e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0988e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6852e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0781e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3070e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6348e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5785e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6329e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4519e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1768e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2604e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8474e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3176e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5127e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8478e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4703e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7345e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7401e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0627e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4335e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8655e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0192e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3459e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0242e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7977e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6825e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2876e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0192e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5961e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2130e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4762e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2220e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3658e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9339e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8896e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6066e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4035e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6827e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2863e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7529e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9746e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6668e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5961e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1088e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5767e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7529e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6145e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9950e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3047e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7190e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5331e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6852e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2233e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5229e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0275e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8664e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1480e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8595e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0443e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3284e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8068e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3319e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4180e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2152e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3812e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5604e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8817e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8512e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5535e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0600e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7867e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3070e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5196e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1053e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4258e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4258e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1237e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8294e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8721e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5803e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3057e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4586e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9889e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5623e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3231e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5545e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2253e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9670e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8273e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0627e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4392e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3047e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1760e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3202e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4355e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1350e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0288e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4674e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7433e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0048e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6907e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0715e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8633e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1914e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7039e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2052e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8662e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8827e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8304e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0288e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7549e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6328e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2341e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5719e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8633e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4615e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6589e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5545e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1269e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0907e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7955e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9225e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7730e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8472e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5251e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2052e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8432e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5719e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5623e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6352e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2098e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7233e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6668e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3057e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2946e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6361e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9580e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9580e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0288e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6129e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6134e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5012e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9427e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2951e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6862e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3057e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1053e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4703e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7628e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3238e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4545e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4063e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1237e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8573e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9582e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7289e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1576e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3725e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6129e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3088e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2514e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3996e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3735e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7207e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7730e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2346e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5423e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1648e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3297e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3794e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2514e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8817e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3622e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7617e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7617e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6295e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7006e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9121e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3701e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7957e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3057e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5061e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5161e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6726e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9558e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2951e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6333e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6026e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7955e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2935e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4715e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9735e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0580e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2525e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5242e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2098e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7529e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3781e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0375e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4151e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4728e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0965e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1480e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1760e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3862e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1053e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3781e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9339e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3578e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7772e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8478e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4586e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4519e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5975e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0008e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8139e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4527e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9427e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0918e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4674e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1871e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2333e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6962e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3088e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5100e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7434e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6134e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5134e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4328e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3999e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9432e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8478e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8206e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2525e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6384e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7617e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8602e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1143e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4180e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5953e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7057e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5141e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0869e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4527e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8681e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3781e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2525e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2430e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8827e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6699e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9750e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7132e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7006e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6013e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2452e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9494e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1384e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2253e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8352e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1348e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9582e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9509e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5975e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5308e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1480e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5161e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0262e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3781e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4674e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1876e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3908e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4578e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5807e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3570e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7803e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1191e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5489e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3260e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3057e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6049e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6145e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8216e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0624e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8130e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1461e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1664e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3459e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3290e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1320e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0619e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4858e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8721e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4578e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4247e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6156e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0094e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0443e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5224e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5127e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0255e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8721e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4896e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6545e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3474e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6165e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5807e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9916e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0192e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6180e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5785e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1105e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3668e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0781e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8721e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3202e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3231e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4573e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6604e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1760e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4754e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8997e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1631e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6129e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9427e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3487e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1053e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8816e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8284e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4880e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3600e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9427e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0624e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1441e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9236e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3333e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5999e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4320e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8294e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5489e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2002e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2525e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3269e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8485e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8653e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1827e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5719e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0507e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4772e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7911e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3812e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0443e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4858e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8465e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8382e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9741e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8896e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7529e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7582e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6880e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6668e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8465e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0037e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3474e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1505e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3114e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9155e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5284e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0262e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8816e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5719e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6229e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5351e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9712e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9913e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4068e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7006e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6129e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1237e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3238e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7730e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6852e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4598e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6690e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4973e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4346e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3474e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2010e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6668e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7094e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2010e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7955e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6180e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2525e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6690e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9540e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8264e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4335e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0957e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3849e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0192e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9243e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5100e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3570e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5527e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7368e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8662e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0805e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9631e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 28---------------
Evaluating
				 {'precision': {'supports': 0.9113785557986871, 'contradicts': 0.6448598130841121, 'parts_of_same': 0.7760617760617761}, 'recall': {'supports': 0.9083969465648855, 'contradicts': 0.6, 'parts_of_same': 0.8104838709677419}, 'f1': {'supports': 0.9098853085745495, 'contradicts': 0.6216216216216217, 'parts_of_same': 0.7928994082840236}, 'support': {'supports': 917, 'contradicts': 115, 'parts_of_same': 248}, 'micro_avg': {'precision': 0.86171875, 'recall': 0.86171875, 'f1': 0.86171875, 'support': None}, 'macro_avg': {'precision': 0.7774333816481919, 'recall': 0.7729602725108758, 'f1': 0.7748021128267316, 'support': None}, 'weighted_avg': {'precision': 0.861215886433898, 'recall': 0.86171875, 'f1': 0.861320599768583, 'support': None}}
Loss: tensor(1.2367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6572e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9017e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1237e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1767e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7859e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9856e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6129e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8662e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6931e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7771e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4703e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8375e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4050e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3057e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5794e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6152e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3047e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5100e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5807e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9670e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2098e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3975e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2039e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7955e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9339e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7190e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2220e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6572e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3849e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2525e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2951e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5012e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3088e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0376e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7617e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2686e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2057e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1099e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2152e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9957e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8139e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5284e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5269e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7433e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5284e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2010e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3554e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3229e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8139e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0737e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4266e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5719e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6236e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0443e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9766e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0715e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4239e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7433e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4392e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9015e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4519e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2010e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0035e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5637e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2143e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9670e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7955e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4410e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0531e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8880e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8516e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0655e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5432e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9121e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2726e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8653e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4898e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7955e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8465e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7911e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9180e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2514e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3088e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1593e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1099e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0531e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9558e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8273e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2876e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2191e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7249e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3419e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5623e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5807e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9950e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2010e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5269e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8206e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0096e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2525e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8472e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7094e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3238e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5623e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2684e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3725e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3812e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1648e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4063e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8294e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1480e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6538e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9155e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6388e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7957e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0664e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8324e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2191e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1576e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2688e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7955e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0600e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6057e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9000e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1576e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9746e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2951e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0715e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1480e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8206e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3658e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6880e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0761e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9853e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1760e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5873e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7859e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1286e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2066e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3887e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6904e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5141e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6910e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6145e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7867e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7006e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1019e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2010e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0035e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5885e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8382e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0990e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0496e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4311e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8662e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8368e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0600e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6484e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2429e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2098e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7205e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7337e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3554e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3290e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1461e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7088e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6145e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4151e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1906e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7571e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9000e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3290e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6572e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8147e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0624e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3269e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3269e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2525e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7190e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3646e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7088e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3290e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3231e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8092e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2098e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4249e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8465e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3339e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0624e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0785e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6904e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2962e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5284e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5061e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9766e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3600e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3668e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5961e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3135e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4151e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1480e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6852e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3570e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6147e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2186e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8092e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8904e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1914e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5623e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3238e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8284e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9000e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7859e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9531e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2341e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3269e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5010e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3779e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4946e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0218e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0192e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5623e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6384e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2863e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0907e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5284e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8472e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1765e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3554e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4703e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5862e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2907e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2002e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7006e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9000e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0008e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0008e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2434e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8139e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0942e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0715e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2057e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2253e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2863e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9670e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1324e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5924e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9030e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1664e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6329e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5794e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5623e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2186e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6329e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6049e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7006e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5423e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0192e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2186e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1237e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0761e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1053e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4156e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5604e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4324e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5489e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7859e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4762e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3812e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3450e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0737e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7617e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3453e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7617e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1079e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0443e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1914e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8721e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2514e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1053e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7595e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1576e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3057e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7859e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5380e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9531e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6572e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4180e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2002e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8721e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0057e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7955e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4239e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5070e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8171e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8346e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0619e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1092e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3419e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6825e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0761e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0957e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0772e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6572e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6329e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0602e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6572e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9950e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2346e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3114e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5801e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0531e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7094e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1167e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0965e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0399e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4180e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7617e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7721e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1914e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8518e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9331e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6049e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2098e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6572e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6154e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7955e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0192e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2002e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7867e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4239e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1664e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0445e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2907e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2421e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9030e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2355e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3125e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1818e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0580e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0965e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9112e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0569e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5048e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5439e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9670e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3492e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8461e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0957e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2525e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8969e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2002e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9950e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8139e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8436e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2536e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0918e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5284e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5380e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7529e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4239e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4203e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1304e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5100e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8988e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3079e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4703e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4335e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3231e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2863e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8454e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8904e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7094e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5450e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1664e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9000e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6145e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1237e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4946e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9489e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4180e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1123e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5794e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1760e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8388e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8382e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4703e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0399e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7604e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4578e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6057e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5100e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9059e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8139e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7094e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4578e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8382e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4703e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4239e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9088e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8294e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6329e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1576e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7198e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0545e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0192e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2863e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0192e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6049e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2966e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7266e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7902e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3231e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3290e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3492e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9540e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8255e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2002e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1123e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4703e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2198e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5527e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9678e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9262e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8589e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9147e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8421e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2002e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6572e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7540e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9015e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9472e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3135e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3290e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4762e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2010e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7617e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1147e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3474e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8657e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5677e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3474e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4858e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5284e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7061e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2951e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3202e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0761e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2429e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2048e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8714e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3803e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7433e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8817e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3995e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2709e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1760e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8478e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5535e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7345e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0262e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0918e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9675e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8904e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4346e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5342e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3047e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7529e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8817e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1746e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7024e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9950e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6910e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8518e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8255e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0192e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6699e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2898e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5425e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1328e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7540e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7190e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9370e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1480e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0218e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6910e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5284e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8286e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6145e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8264e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0688e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1237e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7966e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9189e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5807e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6572e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2863e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2525e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1906e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4762e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1480e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1576e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7337e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2165e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4762e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4703e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1392e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2646e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6572e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3570e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0580e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9088e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7278e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6388e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5623e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9678e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2002e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1237e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2726e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2615e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8662e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3725e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2907e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9189e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4578e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5439e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8382e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9339e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2957e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1760e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6388e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5284e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4762e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0816e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4703e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8255e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0715e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4335e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2043e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3812e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3570e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6484e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7260e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9000e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6476e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9427e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5527e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1141e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4518e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4880e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0192e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0743e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0918e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7587e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7859e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0531e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0761e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1141e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4754e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2429e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7859e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1286e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8022e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2429e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3716e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4335e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0715e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4525e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7821e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9675e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4151e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7859e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7628e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3047e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6388e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9670e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6852e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4525e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9427e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6227e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5284e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7540e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4703e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2429e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 29---------------
Evaluating
				 {'precision': {'supports': 0.9113785557986871, 'contradicts': 0.6448598130841121, 'parts_of_same': 0.7760617760617761}, 'recall': {'supports': 0.9083969465648855, 'contradicts': 0.6, 'parts_of_same': 0.8104838709677419}, 'f1': {'supports': 0.9098853085745495, 'contradicts': 0.6216216216216217, 'parts_of_same': 0.7928994082840236}, 'support': {'supports': 917, 'contradicts': 115, 'parts_of_same': 248}, 'micro_avg': {'precision': 0.86171875, 'recall': 0.86171875, 'f1': 0.86171875, 'support': None}, 'macro_avg': {'precision': 0.7774333816481919, 'recall': 0.7729602725108758, 'f1': 0.7748021128267316, 'support': None}, 'weighted_avg': {'precision': 0.861215886433898, 'recall': 0.86171875, 'f1': 0.861320599768583, 'support': None}}
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3725e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4335e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8139e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4328e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5807e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9331e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9670e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7178e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4239e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4239e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5807e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9155e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3474e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7859e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1576e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2002e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4547e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1053e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7859e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7337e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3716e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0957e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8512e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4239e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1141e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4459e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5807e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3047e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4762e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0218e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0942e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2775e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4490e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0443e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2951e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0008e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5527e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1631e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9489e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3812e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3908e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6572e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5961e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6329e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8896e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8103e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1123e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5807e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4319e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7368e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8626e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2429e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5637e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2421e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2152e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7337e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4459e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4762e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4578e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2253e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9853e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9670e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1180e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8255e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7803e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0192e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1286e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4239e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0037e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5100e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3135e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5623e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0965e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0096e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1906e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6388e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7345e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1467e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3812e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3716e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9339e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4239e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1105e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8264e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9670e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8139e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3658e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9957e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2679e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1218e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4335e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7957e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3231e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5100e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1141e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8264e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6554e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7935e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7540e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1818e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1906e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7337e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7024e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8472e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7432e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9243e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3996e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0899e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2695e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9856e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0761e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4674e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5527e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2709e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2186e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8626e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0037e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7859e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2158e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2525e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1286e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6049e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9339e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5441e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2043e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5100e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6719e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1760e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9856e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2186e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9950e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3231e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0619e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7540e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1906e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4858e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9006e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2429e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9147e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0192e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3474e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0715e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1576e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0192e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4156e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9008e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6668e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9611e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9856e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4180e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8294e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1461e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0805e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1906e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9670e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3658e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6518e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4180e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3231e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6145e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4239e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2341e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4765e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8286e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9699e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9675e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4703e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0619e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8129e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8273e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6910e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5623e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5807e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0096e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4328e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2043e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2604e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7617e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4239e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7859e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3238e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0531e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3047e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7859e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0399e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2010e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9670e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9147e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4335e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2152e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0037e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8139e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7094e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2429e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1384e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4346e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1895e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0216e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2613e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1141e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3996e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7721e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2098e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0008e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5439e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6361e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1237e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1053e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2341e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9339e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5527e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0048e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3135e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2767e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0556e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0715e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4519e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0443e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3716e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7540e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0192e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7337e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1760e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8436e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2429e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8382e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3474e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8904e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5807e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5623e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1286e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4165e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5623e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9670e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0172e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9540e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2098e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9675e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1441e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4779e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4762e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4489e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2429e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4674e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0445e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4762e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0619e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9000e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8382e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6396e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5807e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7190e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6472e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0037e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6049e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7540e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6049e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4762e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2679e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5041e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1297e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9950e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6329e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1746e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1237e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8264e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3238e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7094e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5489e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8284e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8445e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8904e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1099e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3290e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2002e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3812e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2191e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7538e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3716e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2253e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4858e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6055e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6572e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6049e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9059e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8721e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0218e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5586e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7617e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8483e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3231e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9147e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4068e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0715e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4335e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9670e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9169e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7249e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6644e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2341e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2679e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9147e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7902e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9582e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5767e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6388e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1141e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0104e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8637e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1648e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7859e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7859e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7397e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0531e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9950e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2010e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3474e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7617e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3716e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4598e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2767e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7132e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7514e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8382e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1141e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8662e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2255e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2002e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1648e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8904e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7094e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3450e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6472e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2545e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6668e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9675e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0737e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1914e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2414e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1906e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2372e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1141e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9147e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2098e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8472e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2898e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5100e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4180e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8264e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9856e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5527e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8644e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4239e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1818e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3135e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8721e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9178e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0008e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4239e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9273e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6049e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9331e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2767e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9670e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4703e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7549e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4239e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5196e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4762e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5284e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7859e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5999e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0192e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0218e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1760e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0545e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0192e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4703e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4578e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1105e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4335e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4239e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6049e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8721e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0096e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8074e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1906e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6484e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8264e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1480e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5527e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2002e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0737e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8662e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4180e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9856e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4578e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0096e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3290e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0619e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3474e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5623e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2684e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1480e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8904e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7549e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7161e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6572e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8896e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4984e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4578e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4779e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7859e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0737e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8382e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0957e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0761e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3658e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7859e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8198e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8436e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8662e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8969e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2002e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9675e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2010e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1421e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3474e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2186e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6397e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4151e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2613e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0443e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6910e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6361e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5284e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2767e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8382e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3290e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7125e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4578e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4239e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3716e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3812e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0470e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6333e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1286e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6049e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1459e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8110e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6476e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2429e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2863e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4130e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3278e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0074e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1141e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3812e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5527e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8988e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8264e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9313e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1576e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0715e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3509e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2152e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4335e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2429e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2191e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0942e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8382e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5041e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8139e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4765e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4519e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2372e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8904e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9169e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2429e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2709e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1664e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7178e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9670e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2889e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4180e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8295e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1368e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9675e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4703e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0192e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6572e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1622e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9147e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0037e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3135e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2767e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5041e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0008e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5100e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2429e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2613e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6145e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5975e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8721e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3716e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4703e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3658e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0288e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8904e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4180e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7617e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5100e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6329e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5873e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4762e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6180e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0376e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8382e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3450e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9853e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5527e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5527e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4946e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0443e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9331e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4703e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7587e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4346e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6572e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2613e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2186e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0096e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0619e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2613e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5711e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7394e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1480e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3996e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6572e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7337e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1906e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9721e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0061e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6049e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4180e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8286e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2709e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9331e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9147e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0619e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2430e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2253e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6814e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1105e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1105e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8284e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4957e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8436e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7088e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2098e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2767e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6572e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5623e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2186e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9670e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9670e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2613e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7529e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6701e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1721e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3290e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8825e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0965e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2613e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1253e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0376e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0399e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3716e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1803e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2709e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1480e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4239e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1480e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1053e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4858e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1461e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6542e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1105e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2429e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1480e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3474e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5527e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4984e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5794e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2951e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1105e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1141e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2002e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5893e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0096e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3716e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3135e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1237e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9147e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9853e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4063e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4239e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1480e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0454e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5527e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0376e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1576e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3658e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9155e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1421e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4703e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2429e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8969e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6572e-07, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 30---------------
Evaluating
				 {'precision': {'supports': 0.9123767798466593, 'contradicts': 0.6448598130841121, 'parts_of_same': 0.7730769230769231}, 'recall': {'supports': 0.9083969465648855, 'contradicts': 0.6, 'parts_of_same': 0.8104838709677419}, 'f1': {'supports': 0.9103825136612022, 'contradicts': 0.6216216216216217, 'parts_of_same': 0.7913385826771654}, 'support': {'supports': 917, 'contradicts': 115, 'parts_of_same': 248}, 'micro_avg': {'precision': 0.86171875, 'recall': 0.86171875, 'f1': 0.86171875, 'support': None}, 'macro_avg': {'precision': 0.7767711720025648, 'recall': 0.7729602725108758, 'f1': 0.7744475726533296, 'support': None}, 'weighted_avg': {'precision': 0.8613527051149503, 'recall': 0.86171875, 'f1': 0.861374390638864, 'support': None}}
Loss: tensor(4.9670e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8633e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9675e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0942e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0443e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3658e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9264e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4703e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7721e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5284e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8904e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1480e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1906e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4239e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9331e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3057e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9147e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5527e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3290e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1906e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2767e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3290e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3658e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2767e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1664e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4664e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0619e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5100e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5100e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0096e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7902e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3716e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8969e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2429e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5405e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3716e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0924e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4519e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1906e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9147e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7893e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6653e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9427e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3716e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5100e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2379e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4519e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7337e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0399e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9264e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7094e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4762e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8988e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1286e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2613e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9147e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2372e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2767e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0096e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3024e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7094e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2372e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6049e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1141e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3716e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2429e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6572e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4063e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7785e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0781e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2767e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3716e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6910e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2429e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1461e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0898e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2002e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6476e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2613e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4180e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2709e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4180e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0399e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4703e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6145e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1906e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6572e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0039e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2767e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5527e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4151e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9489e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4403e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3339e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2242e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4239e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4534e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5623e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9880e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7540e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9427e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3716e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6484e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7741e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2898e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8198e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5818e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3975e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3474e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5284e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9670e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2186e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8662e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3984e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4703e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5196e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3658e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6491e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7859e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9893e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0891e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8382e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1862e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2171e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6026e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1906e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8721e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6329e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7345e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5807e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3135e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1237e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7617e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9331e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6049e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2525e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7337e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3474e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4147e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5352e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7521e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1467e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2186e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1664e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6572e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5527e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1099e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3047e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6049e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3474e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6910e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5188e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6049e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9243e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0957e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7617e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7094e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5623e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1368e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0619e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8382e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0604e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0619e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3658e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1141e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2767e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5500e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5188e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5527e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1286e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2525e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2613e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1648e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1480e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9574e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7922e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1664e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1421e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0715e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4319e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8904e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9006e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7955e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3812e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2245e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8817e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5284e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0376e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6329e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0619e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8904e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0192e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1141e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5527e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3812e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5100e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7015e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9427e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8255e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3996e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9427e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6668e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8509e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6043e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3135e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4762e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3185e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8264e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5527e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3231e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7337e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5527e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9243e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3658e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5873e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1141e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0288e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6723e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7540e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0531e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2613e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5527e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8273e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2613e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2525e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4180e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7094e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8198e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4239e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7006e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5961e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6049e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8286e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1480e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8139e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2951e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2767e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2767e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4402e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7558e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8969e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9574e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7721e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9147e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8721e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3622e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5380e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2889e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8286e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1141e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0096e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6668e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7094e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5527e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9853e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4703e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1906e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4519e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5041e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8286e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2613e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4847e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7955e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3135e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8382e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0957e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7433e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7337e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2245e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3658e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6476e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1141e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0619e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3716e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9670e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3716e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0037e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9853e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8904e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8110e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4239e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6388e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1141e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1906e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7088e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7859e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9059e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6057e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0715e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0096e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0096e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3474e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4151e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4239e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0743e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0899e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9313e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6476e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0619e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0096e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9088e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2767e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5807e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3290e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8969e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9853e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3290e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8286e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0619e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2253e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9313e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2946e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4703e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2613e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3441e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8721e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6049e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9675e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5260e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0942e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7337e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0019e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2951e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6212e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5999e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2525e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5623e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8478e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4578e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7955e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4519e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3135e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0619e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5961e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1480e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2429e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2951e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0619e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3194e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6049e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8382e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1141e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2372e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4762e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1384e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8286e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1066e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4762e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6735e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7675e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3474e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6388e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2429e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3658e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2429e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6476e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0096e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1141e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3386e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1480e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8074e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6049e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6049e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6026e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2613e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1459e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4222e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4916e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2002e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2613e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0899e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0288e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5004e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2421e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3570e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2429e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0218e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4239e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5284e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0907e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3908e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2951e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2429e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5767e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3135e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5100e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8904e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7337e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2613e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7337e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1141e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0619e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7801e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9856e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6476e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1906e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1141e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5284e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2767e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9487e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9766e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7169e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8382e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7094e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5719e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4762e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2429e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2525e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0192e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8382e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9147e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9856e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6476e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8286e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2951e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3716e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9574e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4068e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3908e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1529e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1079e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8198e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2429e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9920e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3716e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2061e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0619e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2613e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2951e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7337e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8286e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2333e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1794e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0899e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8633e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8286e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7337e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9417e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9000e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3716e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4068e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0545e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3996e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0531e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0288e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0562e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0619e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0104e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4239e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3716e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0619e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4762e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6026e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3047e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1906e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2341e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0096e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3092e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6145e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8092e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4239e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2767e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6049e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0957e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5004e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0096e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8382e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3716e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4239e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7763e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1480e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0715e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0435e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4143e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6825e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2640e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6476e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4239e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8382e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8286e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3725e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2525e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1141e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4703e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8323e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8139e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6668e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5527e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3716e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9030e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4335e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6026e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9427e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4180e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0096e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1286e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8139e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3578e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0399e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6476e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0242e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2767e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3716e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8286e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1384e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1141e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1906e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2613e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6572e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0008e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9302e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9331e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8382e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3386e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2061e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1664e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7754e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3105e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4858e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8382e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4239e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3716e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8286e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1227e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7859e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8286e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2421e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4239e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4151e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8721e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9853e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3716e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0619e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5953e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3716e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5527e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8286e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5271e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0096e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7337e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3640e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0957e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5527e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1053e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0957e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2951e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5100e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9670e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2010e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4239e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6049e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8286e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0957e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3716e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3996e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3135e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7337e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1906e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3135e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1141e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0096e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3474e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2429e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1461e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7161e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9670e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0096e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1368e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3474e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6026e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0435e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1906e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8286e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1906e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0619e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6484e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0580e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1421e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6145e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9331e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7763e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8043e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8566e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2525e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5127e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1384e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2889e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7516e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8286e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7249e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1664e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2186e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9670e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4916e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3453e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7094e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0096e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2186e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0619e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3135e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4762e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1906e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1664e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6756e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0096e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3658e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1480e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6657e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4143e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2767e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2767e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6329e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7337e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6156e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8286e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1906e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0694e-06, device='cuda:0', grad_fn=<DivBackward0>)


		-------------RUN 5-----------
			------------EPOCH 1---------------
Evaluating
				 {'precision': {'supports': 0.6934579439252336, 'contradicts': 0.09689213893967093, 'parts_of_same': 0.1791044776119403}, 'recall': {'supports': 0.4364705882352941, 'contradicts': 0.45689655172413796, 'parts_of_same': 0.096}, 'f1': {'supports': 0.535740072202166, 'contradicts': 0.15987933634992457, 'parts_of_same': 0.125}, 'support': {'supports': 850, 'contradicts': 116, 'parts_of_same': 250}, 'micro_avg': {'precision': 0.3684210526315789, 'recall': 0.3684210526315789, 'f1': 0.3684210526315789, 'support': None}, 'macro_avg': {'precision': 0.32315152015894827, 'recall': 0.329789046653144, 'f1': 0.27353980285069684, 'support': None}, 'weighted_avg': {'precision': 0.5308016939608845, 'recall': 0.3684210526315789, 'f1': 0.4154400200562766, 'support': None}}
Loss: tensor(0.3600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3919, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3944, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1676, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0789, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3992, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0863, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3747, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1886, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0989, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3741, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1927, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8818, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3839, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3730, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3821, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9952, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7879, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3742, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0885, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4928, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3789, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3921, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3890, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0938, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8917, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8886, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5742, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6959, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8971, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1990, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0942, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5997, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1999, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3883, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6951, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2943, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1737, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1889, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2819, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9985, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1937, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1690, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1815, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1992, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2920, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2947, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7867, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0999, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0772, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4803, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5973, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5997, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2979, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7867, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5995, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4915, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3687, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2925, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3000, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3800, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8890, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5946, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4934, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2941, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2840, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1877, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1820, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2834, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1866, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2951, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2900, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3992, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2924, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1808, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2959, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4840, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1846, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0954, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0887, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2897, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0846, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3996, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2866, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0846, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1733, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2742, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0943, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2909, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0917, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2988, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1944, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1904, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1877, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2993, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3846, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2752, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1782, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1997, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2834, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1912, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1908, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3956, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4943, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1660, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5944, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9747, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2772, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0742, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1942, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2903, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1805, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1762, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0879, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1867, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0806, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3716, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9720, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2687, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5923, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0747, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2943, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4997, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6955, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2890, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2912, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0883, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3896, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4988, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1687, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0987, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8989, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2955, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3916, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1920, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4877, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0982, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3942, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1777, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7737, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5853, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1676, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1857, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0853, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1837, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3961, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1886, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2839, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6803, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6943, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3979, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1820, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8957, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3979, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0835, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0720, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4853, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4925, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2941, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0981, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3833, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0863, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0941, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3896, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0946, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0920, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9975, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2883, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2742, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0875, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2928, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0805, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3943, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4971, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2960, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1913, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1782, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1992, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1956, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1762, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1690, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3866, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5824, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0986, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2924, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0937, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0866, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0883, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7867, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5910, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0693, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8877, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4676, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2733, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1815, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1896, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0742, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0931, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0926, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8794, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3992, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0862, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2919, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1900, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1936, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6942, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0976, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2951, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2840, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5967, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0782, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4887, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1980, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2794, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1904, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2789, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1889, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1660, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1906, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6860, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1919, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2943, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3926, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2991, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0897, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0951, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5762, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1808, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2840, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1916, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1928, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0924, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0914, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3965, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1951, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6898, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2923, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0575, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0873, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2965, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1892, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8985, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2976, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5911, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0637, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1908, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4877, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0896, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4875, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2930, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3852, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9883, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0733, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2936, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3873, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3771, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4987, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0796, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0782, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0741, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0935, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4953, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1997, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2910, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0975, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0960, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0927, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1808, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1690, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0945, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0959, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3994, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0803, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1782, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2988, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1913, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0852, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4913, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8796, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2909, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4940, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3886, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2752, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0993, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3900, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5914, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2741, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0933, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1830, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2805, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0690, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1808, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2878, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9767, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0993, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2873, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0824, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1660, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0767, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0904, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2903, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5736, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1998, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9945, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1887, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0926, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2998, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3806, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0863, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1948, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3938, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0958, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7784, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0866, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0994, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8976, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0849, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0839, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1818, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3900, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1967, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3965, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4789, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1733, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3762, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0676, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0885, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1835, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1753, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 2---------------
Evaluating
				 {'precision': {'supports': 0.8841607565011821, 'contradicts': 0.5419847328244275, 'parts_of_same': 0.7364016736401674}, 'recall': {'supports': 0.88, 'contradicts': 0.6120689655172413, 'parts_of_same': 0.704}, 'f1': {'supports': 0.8820754716981133, 'contradicts': 0.5748987854251013, 'parts_of_same': 0.7198364008179959}, 'support': {'supports': 850, 'contradicts': 116, 'parts_of_same': 250}, 'micro_avg': {'precision': 0.8182565789473685, 'recall': 0.8182565789473685, 'f1': 0.8182565789473685, 'support': None}, 'macro_avg': {'precision': 0.7208490543219256, 'recall': 0.7320229885057472, 'f1': 0.7256035526470702, 'support': None}, 'weighted_avg': {'precision': 0.8211408638517107, 'recall': 0.8182565789473685, 'f1': 0.8194173604088874, 'support': None}}
Loss: tensor(0.4418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7969, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1953, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7952, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0927, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0981, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1992, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4772, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0852, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1980, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4951, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0927, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0716, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9952, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3891, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8965, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0982, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1920, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0849, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0730, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3818, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1806, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0916, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0637, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2937, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0787, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0891, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1918, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2739, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0806, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1939, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4936, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0784, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6878, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6800, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1903, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0794, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6833, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1951, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1800, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0821, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0944, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5835, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2998, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1939, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4903, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0767, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0885, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0742, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3944, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0916, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2764, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0898, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0957, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0890, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0716, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0961, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0883, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0892, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4733, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3733, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5991, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0690, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0660, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0819, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0839, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0955, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0968, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4676, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3737, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0824, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2796, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1990, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4959, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0758, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0967, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6863, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0928, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1820, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0909, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5944, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0817, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0993, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1000, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2939, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0676, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1762, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0911, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0883, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0910, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0803, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0874, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0736, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0980, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3917, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1912, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1741, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3962, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0933, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0898, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0958, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0852, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1957, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2928, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0927, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3935, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1933, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1892, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0863, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0918, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0971, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2818, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8771, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1860, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0870, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0716, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0993, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6741, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1874, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1986, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0819, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0747, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1911, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0877, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1833, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1969, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1923, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0820, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2875, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4994, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1777, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0860, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1853, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0800, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1969, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0789, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4953, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0961, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0997, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0918, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6875, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0947, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2995, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0937, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3918, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2967, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0803, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2764, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2979, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4951, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3853, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7906, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1870, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1972, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8800, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0849, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3742, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0751, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0747, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4979, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0739, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0921, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4986, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0886, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0989, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7985, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0883, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2676, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1976, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5796, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1846, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0982, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5985, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1890, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0927, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6943, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0690, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0945, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4959, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0927, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1771, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1941, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1900, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0954, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1000, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3736, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2915, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0998, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1969, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0739, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2909, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0976, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1938, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9747, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5926, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2803, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0784, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2921, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4995, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2801, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1953, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2951, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0910, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1918, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1956, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0919, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2900, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0941, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6839, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0690, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0997, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1771, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0824, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1771, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1943, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0819, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2830, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1934, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0938, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1772, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1890, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2771, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1815, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2747, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1915, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6990, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 3---------------
Evaluating
				 {'precision': {'supports': 0.9363636363636364, 'contradicts': 0.363265306122449, 'parts_of_same': 0.6527331189710611}, 'recall': {'supports': 0.7270588235294118, 'contradicts': 0.7672413793103449, 'parts_of_same': 0.812}, 'f1': {'supports': 0.8185430463576158, 'contradicts': 0.4930747922437673, 'parts_of_same': 0.7237076648841354}, 'support': {'supports': 850, 'contradicts': 116, 'parts_of_same': 250}, 'micro_avg': {'precision': 0.7483552631578947, 'recall': 0.7483552631578947, 'f1': 0.7483552631578947, 'support': None}, 'macro_avg': {'precision': 0.6507873538190488, 'recall': 0.7687667342799189, 'f1': 0.6784418344951728, 'support': None}, 'weighted_avg': {'precision': 0.8233808767780102, 'recall': 0.7483552631578947, 'f1': 0.7679976821753982, 'support': None}}
Loss: tensor(0.0433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3862, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0952, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1928, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2679, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0733, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3741, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1679, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0972, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3925, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0862, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0903, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1837, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1988, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0679, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1948, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3986, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0857, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3660, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4896, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5762, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3874, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5805, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3801, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5877, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0796, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0987, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0946, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0952, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1995, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0936, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0883, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0883, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0920, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0879, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0962, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0801, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7930, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8953, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0771, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1928, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0989, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3968, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0839, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0989, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0830, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0975, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2938, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2904, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1834, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0575, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4999, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3919, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1993, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3741, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5883, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2953, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0995, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1758, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4989, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1985, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0989, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1989, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1890, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3990, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1751, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4937, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1824, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6751, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2918, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3962, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0808, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8888, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0948, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2679, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3913, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2956, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2747, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6994, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0890, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0815, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0830, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1991, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0913, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1985, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1998, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0867, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0888, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9980, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2736, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0991, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1973, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0849, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5690, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0933, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0638, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0873, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0960, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5976, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4889, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0940, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0747, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1839, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2911, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2934, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5834, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1687, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0927, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3887, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2575, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4926, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2862, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0730, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0417, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 4---------------
Evaluating
				 {'precision': {'supports': 0.9077540106951871, 'contradicts': 0.68, 'parts_of_same': 0.5652173913043478}, 'recall': {'supports': 0.7988235294117647, 'contradicts': 0.5862068965517241, 'parts_of_same': 0.832}, 'f1': {'supports': 0.8498122653316645, 'contradicts': 0.6296296296296295, 'parts_of_same': 0.6731391585760518}, 'support': {'supports': 850, 'contradicts': 116, 'parts_of_same': 250}, 'micro_avg': {'precision': 0.7853618421052632, 'recall': 0.7853618421052632, 'f1': 0.7853618421052632, 'support': None}, 'macro_avg': {'precision': 0.717657133999845, 'recall': 0.7390101419878295, 'f1': 0.7175270178457819, 'support': None}, 'weighted_avg': {'precision': 0.815604652069898, 'recall': 0.7853618421052632, 'f1': 0.7924854047803988, 'support': None}}
Loss: tensor(0.0747, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1808, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0874, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0805, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0693, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2693, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0878, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0866, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2997, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3945, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0960, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6994, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4911, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0921, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0915, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0909, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1937, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0805, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0730, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0784, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0973, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2784, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1874, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3918, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0764, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1979, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1906, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0752, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5923, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1935, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0835, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0877, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4942, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4952, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4730, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1939, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1896, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3979, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9638, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0837, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1886, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1919, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3916, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1948, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0919, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4911, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2793, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2867, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6954, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5906, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0739, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4693, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0767, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1866, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0638, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0819, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0903, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2866, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1990, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0889, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8819, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0996, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0969, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2839, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4793, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0806, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1730, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4986, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0909, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0941, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3936, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2911, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1771, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 5---------------
Evaluating
				 {'precision': {'supports': 0.883855981416957, 'contradicts': 0.6106194690265486, 'parts_of_same': 0.7479338842975206}, 'recall': {'supports': 0.8952941176470588, 'contradicts': 0.5948275862068966, 'parts_of_same': 0.724}, 'f1': {'supports': 0.8895382817066043, 'contradicts': 0.6026200873362445, 'parts_of_same': 0.7357723577235773}, 'support': {'supports': 850, 'contradicts': 116, 'parts_of_same': 250}, 'micro_avg': {'precision': 0.8314144736842105, 'recall': 0.8314144736842105, 'f1': 0.8314144736842105, 'support': None}, 'macro_avg': {'precision': 0.7474697782470088, 'recall': 0.7380405679513183, 'f1': 0.7426435755888088, 'support': None}, 'weighted_avg': {'precision': 0.829846146123251, 'recall': 0.8314144736842105, 'f1': 0.8305547360300266, 'support': None}}
Loss: tensor(0.3495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0764, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6879, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1879, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1866, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7852, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0930, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0736, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0914, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6979, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5887, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0891, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4981, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6794, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1888, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1867, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0805, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0961, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1833, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2787, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0911, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7848, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2982, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3772, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0690, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4998, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0971, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9938, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3801, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0960, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0952, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0800, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0830, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3903, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0961, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1935, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0852, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1910, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2988, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2887, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0839, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1997, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2867, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0839, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1911, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 6---------------
Evaluating
				 {'precision': {'supports': 0.8829915560916767, 'contradicts': 0.553030303030303, 'parts_of_same': 0.6980392156862745}, 'recall': {'supports': 0.8611764705882353, 'contradicts': 0.6293103448275862, 'parts_of_same': 0.712}, 'f1': {'supports': 0.8719475878499107, 'contradicts': 0.5887096774193549, 'parts_of_same': 0.7049504950495049}, 'support': {'supports': 850, 'contradicts': 116, 'parts_of_same': 250}, 'micro_avg': {'precision': 0.8083881578947368, 'recall': 0.8083881578947368, 'f1': 0.8083881578947368, 'support': None}, 'macro_avg': {'precision': 0.7113536916027513, 'recall': 0.7341622718052738, 'f1': 0.7218692534395901, 'support': None}, 'weighted_avg': {'precision': 0.8134902481505007, 'recall': 0.8083881578947368, 'f1': 0.8105948980390176, 'support': None}}
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0992, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2956, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2888, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0991, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0940, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(13.7855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0818, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2575, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5968, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7833, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4945, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0923, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0918, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0947, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0992, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0730, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5925, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5993, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0575, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1939, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1909, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0912, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1975, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4890, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3940, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0803, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0730, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0939, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3885, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3737, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0953, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2787, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3939, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7853, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0862, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1945, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0758, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0764, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4995, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0730, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2993, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0924, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1834, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5558e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 7---------------
Evaluating
				 {'precision': {'supports': 0.8985330073349633, 'contradicts': 0.518796992481203, 'parts_of_same': 0.7320754716981132}, 'recall': {'supports': 0.8647058823529412, 'contradicts': 0.5948275862068966, 'parts_of_same': 0.776}, 'f1': {'supports': 0.881294964028777, 'contradicts': 0.5542168674698795, 'parts_of_same': 0.753398058252427}, 'support': {'supports': 850, 'contradicts': 116, 'parts_of_same': 250}, 'micro_avg': {'precision': 0.8207236842105263, 'recall': 0.8207236842105263, 'f1': 0.8207236842105263, 'support': None}, 'macro_avg': {'precision': 0.7164684905047598, 'recall': 0.7451778228532793, 'f1': 0.7296366299170279, 'support': None}, 'weighted_avg': {'precision': 0.828085834940022, 'recall': 0.8207236842105263, 'f1': 0.8237988409655208, 'support': None}}
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0660, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1972, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1973, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0889, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0930, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0961, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0833, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3742, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0758, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3919, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0824, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0866, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0954, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0638, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2962, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2987, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0987, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1985, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0720, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0985, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0819, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1971, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1846, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0944, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0896, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0914, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0896, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2849, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7835, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7862, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2949, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0888, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0794, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0959, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1747, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1752, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0971, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0784, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1944, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0777, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0942, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8906, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0947, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0720, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1800, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2945, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2863, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1789, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0957, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1777, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0690, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 8---------------
Evaluating
				 {'precision': {'supports': 0.8806306306306306, 'contradicts': 0.6095238095238096, 'parts_of_same': 0.820627802690583}, 'recall': {'supports': 0.92, 'contradicts': 0.5517241379310345, 'parts_of_same': 0.732}, 'f1': {'supports': 0.8998849252013809, 'contradicts': 0.5791855203619909, 'parts_of_same': 0.7737843551797039}, 'support': {'supports': 850, 'contradicts': 116, 'parts_of_same': 250}, 'micro_avg': {'precision': 0.8462171052631579, 'recall': 0.8462171052631579, 'f1': 0.8462171052631579, 'support': None}, 'macro_avg': {'precision': 0.7702607476150077, 'recall': 0.7345747126436782, 'f1': 0.7509516002476918, 'support': None}, 'weighted_avg': {'precision': 0.8424323590571084, 'recall': 0.8462171052631579, 'f1': 0.8433666082056666, 'support': None}}
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0890, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0913, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0910, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1962, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1934, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1961, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0867, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 9---------------
Evaluating
				 {'precision': {'supports': 0.8941736028537456, 'contradicts': 0.5818181818181818, 'parts_of_same': 0.7396226415094339}, 'recall': {'supports': 0.8847058823529412, 'contradicts': 0.5517241379310345, 'parts_of_same': 0.784}, 'f1': {'supports': 0.8894145476049675, 'contradicts': 0.5663716814159292, 'parts_of_same': 0.7611650485436892}, 'support': {'supports': 850, 'contradicts': 116, 'parts_of_same': 250}, 'micro_avg': {'precision': 0.8322368421052632, 'recall': 0.8322368421052632, 'f1': 0.8322368421052633, 'support': None}, 'macro_avg': {'precision': 0.7385381420604538, 'recall': 0.7401433400946585, 'f1': 0.7389837591881953, 'support': None}, 'weighted_avg': {'precision': 0.832602082149631, 'recall': 0.8322368421052632, 'f1': 0.8322308738851912, 'support': None}}
Loss: tensor(4.1074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4129e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0782, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1912, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0881, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0896, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0575, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0972, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6995, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0739, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8805, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0780, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 10---------------
Evaluating
				 {'precision': {'supports': 0.9045161290322581, 'contradicts': 0.5323741007194245, 'parts_of_same': 0.6589403973509934}, 'recall': {'supports': 0.8247058823529412, 'contradicts': 0.6379310344827587, 'parts_of_same': 0.796}, 'f1': {'supports': 0.8627692307692307, 'contradicts': 0.5803921568627451, 'parts_of_same': 0.7210144927536232}, 'support': {'supports': 850, 'contradicts': 116, 'parts_of_same': 250}, 'micro_avg': {'precision': 0.8009868421052632, 'recall': 0.8009868421052632, 'f1': 0.8009868421052632, 'support': None}, 'macro_avg': {'precision': 0.6986102090342253, 'recall': 0.7528789722785666, 'f1': 0.7213919601285329, 'support': None}, 'weighted_avg': {'precision': 0.8185273064955765, 'recall': 0.8009868421052632, 'f1': 0.8066882890940217, 'support': None}}
Loss: tensor(8.3595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1969, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0860, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0957, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1878, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6946, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0817, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8925, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5937, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0976, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1878, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0752, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1957, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0906, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0733, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0767, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0945, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0720, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0805, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2997, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0772, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9969, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0971, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0690, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0886, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1867, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6909, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4733, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0943, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3965, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2946, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2857, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6955, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5913, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0751, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1925, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2979, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1918, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0889, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1739, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0941, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0959, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1821, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0986, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0927, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2920, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2913, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5897, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9737, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0891, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0916, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0789, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5638, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1951, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1896, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1866, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0963, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(10.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0794, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4878, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0739, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0952, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0999, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0989, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 11---------------
Evaluating
				 {'precision': {'supports': 0.876993166287016, 'contradicts': 0.6666666666666666, 'parts_of_same': 0.7237354085603113}, 'recall': {'supports': 0.9058823529411765, 'contradicts': 0.46551724137931033, 'parts_of_same': 0.744}, 'f1': {'supports': 0.8912037037037037, 'contradicts': 0.548223350253807, 'parts_of_same': 0.7337278106508877}, 'support': {'supports': 850, 'contradicts': 116, 'parts_of_same': 250}, 'micro_avg': {'precision': 0.8305921052631579, 'recall': 0.8305921052631579, 'f1': 0.8305921052631579, 'support': None}, 'macro_avg': {'precision': 0.755798413837998, 'recall': 0.7051331981068291, 'f1': 0.7243849548694662, 'support': None}, 'weighted_avg': {'precision': 0.8254205401458673, 'recall': 0.8305921052631579, 'f1': 0.8261093827634142, 'support': None}}
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2949, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0679, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0898, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4915, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9906, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8972, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3999, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4870, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0767, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0819, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2969, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2967, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0848, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0638, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0924, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0956, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1758, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1959, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0676, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2830, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1866, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6660, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2944, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0989, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0961, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1660, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 12---------------
Evaluating
				 {'precision': {'supports': 0.8939393939393939, 'contradicts': 0.5407407407407407, 'parts_of_same': 0.8116591928251121}, 'recall': {'supports': 0.9023529411764706, 'contradicts': 0.6293103448275862, 'parts_of_same': 0.724}, 'f1': {'supports': 0.8981264637002342, 'contradicts': 0.5816733067729083, 'parts_of_same': 0.7653276955602536}, 'support': {'supports': 850, 'contradicts': 116, 'parts_of_same': 250}, 'micro_avg': {'precision': 0.8396381578947368, 'recall': 0.8396381578947368, 'f1': 0.8396381578947368, 'support': None}, 'macro_avg': {'precision': 0.7487797758350823, 'recall': 0.7518877620013523, 'f1': 0.748375822011132, 'support': None}, 'weighted_avg': {'precision': 0.8433299415959612, 'recall': 0.8396381578947368, 'f1': 0.8406361197540458, 'support': None}}
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0981, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1741, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5801, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1892, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7800, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1935, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0660, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 13---------------
Evaluating
				 {'precision': {'supports': 0.8695652173913043, 'contradicts': 0.68, 'parts_of_same': 0.7622950819672131}, 'recall': {'supports': 0.9176470588235294, 'contradicts': 0.4396551724137931, 'parts_of_same': 0.744}, 'f1': {'supports': 0.8929593589009731, 'contradicts': 0.5340314136125655, 'parts_of_same': 0.7530364372469635}, 'support': {'supports': 850, 'contradicts': 116, 'parts_of_same': 250}, 'micro_avg': {'precision': 0.8363486842105263, 'recall': 0.8363486842105263, 'f1': 0.8363486842105263, 'support': None}, 'macro_avg': {'precision': 0.7706200997861724, 'recall': 0.7004340770791074, 'f1': 0.7266757365868339, 'support': None}, 'weighted_avg': {'precision': 0.8294278003901414, 'recall': 0.8363486842105263, 'f1': 0.8299524739774882, 'support': None}}
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1986, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0923, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0906, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0660, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 14---------------
Evaluating
				 {'precision': {'supports': 0.8707182320441988, 'contradicts': 0.6777777777777778, 'parts_of_same': 0.8054298642533937}, 'recall': {'supports': 0.9270588235294117, 'contradicts': 0.5258620689655172, 'parts_of_same': 0.712}, 'f1': {'supports': 0.898005698005698, 'contradicts': 0.5922330097087379, 'parts_of_same': 0.7558386411889597}, 'support': {'supports': 850, 'contradicts': 116, 'parts_of_same': 250}, 'micro_avg': {'precision': 0.8445723684210527, 'recall': 0.8445723684210527, 'f1': 0.8445723684210525, 'support': None}, 'macro_avg': {'precision': 0.7846419580251235, 'recall': 0.7216402974983097, 'f1': 0.7486924496344652, 'support': None}, 'weighted_avg': {'precision': 0.8388899551999504, 'recall': 0.8445723684210527, 'f1': 0.8396081683620862, 'support': None}}
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0936, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2930, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4820, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1767, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0758, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6892, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0896, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0693, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0934, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4794, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1955, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3819, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1909, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2793, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6837, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0853, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2954, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2917, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9736, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1914, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 15---------------
Evaluating
				 {'precision': {'supports': 0.8880597014925373, 'contradicts': 0.6082474226804123, 'parts_of_same': 0.6253968253968254}, 'recall': {'supports': 0.84, 'contradicts': 0.5086206896551724, 'parts_of_same': 0.788}, 'f1': {'supports': 0.8633615477629987, 'contradicts': 0.5539906103286385, 'parts_of_same': 0.6973451327433628}, 'support': {'supports': 850, 'contradicts': 116, 'parts_of_same': 250}, 'micro_avg': {'precision': 0.7976973684210527, 'recall': 0.7976973684210527, 'f1': 0.7976973684210527, 'support': None}, 'macro_avg': {'precision': 0.7072346498565917, 'recall': 0.7122068965517242, 'f1': 0.7048990969450001, 'support': None}, 'weighted_avg': {'precision': 0.8073656691190715, 'recall': 0.7976973684210527, 'f1': 0.7997175243277234, 'support': None}}
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2733, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7690, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3913, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7986, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0821, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0720, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0730, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2883, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5973, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0938, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0952, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9985, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8925, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0846, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4762, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3693, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0848, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3575, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1980, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1896, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0965, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2962, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3660, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0987, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 16---------------
Evaluating
				 {'precision': {'supports': 0.8725824800910125, 'contradicts': 0.5865384615384616, 'parts_of_same': 0.7682403433476395}, 'recall': {'supports': 0.9023529411764706, 'contradicts': 0.5258620689655172, 'parts_of_same': 0.716}, 'f1': {'supports': 0.8872180451127819, 'contradicts': 0.5545454545454546, 'parts_of_same': 0.7412008281573498}, 'support': {'supports': 850, 'contradicts': 116, 'parts_of_same': 250}, 'micro_avg': {'precision': 0.828125, 'recall': 0.828125, 'f1': 0.828125, 'support': None}, 'macro_avg': {'precision': 0.7424537616590378, 'recall': 0.7147383367139959, 'f1': 0.7276547759385288, 'support': None}, 'weighted_avg': {'precision': 0.8238434666552074, 'recall': 0.828125, 'f1': 0.8254628438424958, 'support': None}}
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2968, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1892, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2806, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3660, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0747, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2955, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2889, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3923, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0764, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1835, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5857, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0919, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5857, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0958, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1928, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 17---------------
Evaluating
				 {'precision': {'supports': 0.8731257208765859, 'contradicts': 0.5826086956521739, 'parts_of_same': 0.7350427350427351}, 'recall': {'supports': 0.8905882352941177, 'contradicts': 0.5775862068965517, 'parts_of_same': 0.688}, 'f1': {'supports': 0.8817705299941759, 'contradicts': 0.58008658008658, 'parts_of_same': 0.7107438016528925}, 'support': {'supports': 850, 'contradicts': 116, 'parts_of_same': 250}, 'micro_avg': {'precision': 0.819078947368421, 'recall': 0.819078947368421, 'f1': 0.819078947368421, 'support': None}, 'macro_avg': {'precision': 0.7302590505238316, 'recall': 0.7187248140635564, 'f1': 0.724200303911216, 'support': None}, 'weighted_avg': {'precision': 0.8170231539485476, 'recall': 0.819078947368421, 'f1': 0.8178297238472994, 'support': None}}
Loss: tensor(3.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5439e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7024e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0846, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1800, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2982, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1846, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5764, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0991, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0834, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9918, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5980, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3940, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1923, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8914, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0693, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0987, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0987, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1803, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2987, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0908, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6808, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2956, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0796, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2904, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1918, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8849, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1971, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0949, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1934, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2923, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0637, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1870, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0972, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4000, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0918, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4918, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3874, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0730, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1925, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5918, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4920, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9873, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1739, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1971, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0890, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0815, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0739, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3874, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1912, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1908, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0942, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0883, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2928, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0979, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1953, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0867, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1931, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3229, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 18---------------
Evaluating
				 {'precision': {'supports': 0.9194187582562747, 'contradicts': 0.4968152866242038, 'parts_of_same': 0.6854304635761589}, 'recall': {'supports': 0.8188235294117647, 'contradicts': 0.6724137931034483, 'parts_of_same': 0.828}, 'f1': {'supports': 0.866210329807094, 'contradicts': 0.5714285714285715, 'parts_of_same': 0.7499999999999999}, 'support': {'supports': 850, 'contradicts': 116, 'parts_of_same': 250}, 'micro_avg': {'precision': 0.8067434210526315, 'recall': 0.8067434210526315, 'f1': 0.8067434210526315, 'support': None}, 'macro_avg': {'precision': 0.7005548361522126, 'recall': 0.773079107505071, 'f1': 0.7292129670785551, 'support': None}, 'weighted_avg': {'precision': 0.8309984651811522, 'recall': 0.8067434210526315, 'f1': 0.8141977751823554, 'support': None}}
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0892, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4985, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0920, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0963, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1941, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7992, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2808, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0676, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8002e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 19---------------
Evaluating
				 {'precision': {'supports': 0.8756998880179171, 'contradicts': 0.6236559139784946, 'parts_of_same': 0.8}, 'recall': {'supports': 0.92, 'contradicts': 0.5, 'parts_of_same': 0.736}, 'f1': {'supports': 0.8973034997131383, 'contradicts': 0.5550239234449761, 'parts_of_same': 0.7666666666666666}, 'support': {'supports': 850, 'contradicts': 116, 'parts_of_same': 250}, 'micro_avg': {'precision': 0.8421052631578947, 'recall': 0.8421052631578947, 'f1': 0.8421052631578947, 'support': None}, 'macro_avg': {'precision': 0.766451933998804, 'recall': 0.7186666666666666, 'f1': 0.7396646966082603, 'support': None}, 'weighted_avg': {'precision': 0.8360929200959991, 'recall': 0.8421052631578947, 'f1': 0.8377939280776738, 'support': None}}
Loss: tensor(7.5379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0945, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0742, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4534e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9558e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0820, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4681e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 20---------------
Evaluating
				 {'precision': {'supports': 0.8723640399556049, 'contradicts': 0.6222222222222222, 'parts_of_same': 0.8044444444444444}, 'recall': {'supports': 0.9247058823529412, 'contradicts': 0.4827586206896552, 'parts_of_same': 0.724}, 'f1': {'supports': 0.8977727013135351, 'contradicts': 0.5436893203883495, 'parts_of_same': 0.7621052631578947}, 'support': {'supports': 850, 'contradicts': 116, 'parts_of_same': 250}, 'micro_avg': {'precision': 0.8412828947368421, 'recall': 0.8412828947368421, 'f1': 0.8412828947368421, 'support': None}, 'macro_avg': {'precision': 0.7663435688740905, 'recall': 0.7104881676808654, 'f1': 0.7345224282865931, 'support': None}, 'weighted_avg': {'precision': 0.8345380944499613, 'recall': 0.8412828947368421, 'f1': 0.8361028561439368, 'support': None}}
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3586e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4715e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9916e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7973e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4353e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4715e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4310e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9015e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1191e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1320e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5664e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3130e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8425e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 21---------------
Evaluating
				 {'precision': {'supports': 0.8677595628415301, 'contradicts': 0.6263736263736264, 'parts_of_same': 0.8380952380952381}, 'recall': {'supports': 0.9341176470588235, 'contradicts': 0.49137931034482757, 'parts_of_same': 0.704}, 'f1': {'supports': 0.8997167138810197, 'contradicts': 0.5507246376811593, 'parts_of_same': 0.7652173913043478}, 'support': {'supports': 850, 'contradicts': 116, 'parts_of_same': 250}, 'micro_avg': {'precision': 0.8445723684210527, 'recall': 0.8445723684210527, 'f1': 0.8445723684210525, 'support': None}, 'macro_avg': {'precision': 0.7774094757701316, 'recall': 0.7098323191345504, 'f1': 0.7385529142888423, 'support': None}, 'weighted_avg': {'precision': 0.8386338639789891, 'recall': 0.8445723684210527, 'f1': 0.8387727077269476, 'support': None}}
Loss: tensor(1.6855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2317e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5077e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3767e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4172e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8505e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4361e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6657e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7664e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0752, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6706e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1863e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1746e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9070e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6423e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4032e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3492e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7973e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1088e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2026e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2949e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2198e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1249e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5439e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4129e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1602e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5352e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8516e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8101e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4388e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2044e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6304e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7430e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5258e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9218e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5229e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8043e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8154e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5578e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2044e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3518e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9602e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4900e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2832e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0474e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7969e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4172e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4353e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9010e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3792e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1220e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0869e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5990e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5388e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5895e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8898e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0461e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 22---------------
Evaluating
				 {'precision': {'supports': 0.8762541806020067, 'contradicts': 0.6373626373626373, 'parts_of_same': 0.8026315789473685}, 'recall': {'supports': 0.9247058823529412, 'contradicts': 0.5, 'parts_of_same': 0.732}, 'f1': {'supports': 0.8998282770463651, 'contradicts': 0.5603864734299516, 'parts_of_same': 0.7656903765690377}, 'support': {'supports': 850, 'contradicts': 116, 'parts_of_same': 250}, 'micro_avg': {'precision': 0.8445723684210527, 'recall': 0.8445723684210527, 'f1': 0.8445723684210525, 'support': None}, 'macro_avg': {'precision': 0.7720827989706708, 'recall': 0.7189019607843138, 'f1': 0.7419683756817849, 'support': None}, 'weighted_avg': {'precision': 0.8383289590317546, 'recall': 0.8445723684210527, 'f1': 0.8398696221624542, 'support': None}}
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7013e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0865e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5693e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5156e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9783e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1503e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3019e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9554e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7381e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7990e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1050e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8154e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0273e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7918e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4940e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9624e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3260e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9015e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1955e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5258e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8379e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0278e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0295e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2167e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1231e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9397e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6735e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3251e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3293e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2088e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7984e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9059e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6339e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1293e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6077e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3225e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7205e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4015e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9015e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1405e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6273e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5439e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1114e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1406e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9893e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8648e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3854e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4715e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7079e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9057e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6401e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2044e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9015e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7942e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8735e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2320e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6580e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0145e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2406e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3492e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3615e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4695e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9163e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1271e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3352e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4896e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1068e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2973e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7761e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8035e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1699e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0476e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5483e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4266e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6887e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9403e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8302e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8920e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2587e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5741e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6536e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7037e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7792e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1474e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4180e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0664e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1593e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8653e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7783e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4324e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2406e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4127e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1646e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6101e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 23---------------
Evaluating
				 {'precision': {'supports': 0.8754171301446051, 'contradicts': 0.6444444444444445, 'parts_of_same': 0.801762114537445}, 'recall': {'supports': 0.9258823529411765, 'contradicts': 0.5, 'parts_of_same': 0.728}, 'f1': {'supports': 0.8999428244711264, 'contradicts': 0.5631067961165049, 'parts_of_same': 0.7631027253668764}, 'support': {'supports': 850, 'contradicts': 116, 'parts_of_same': 250}, 'micro_avg': {'precision': 0.8445723684210527, 'recall': 0.8445723684210527, 'f1': 0.8445723684210525, 'support': None}, 'macro_avg': {'precision': 0.7738745630421647, 'recall': 0.7179607843137253, 'f1': 0.7420507819848359, 'support': None}, 'weighted_avg': {'precision': 0.8382406618526572, 'recall': 0.8445723684210527, 'f1': 0.8396771961280355, 'support': None}}
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0474e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5041e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0123e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3310e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6163e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9269e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6887e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3041e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8527e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3862e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4896e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7066e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6891e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5450e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6255e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9668e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2225e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2044e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9125e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1726e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3063e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6026e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6421e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4534e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4695e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2949e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0022e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7664e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6931e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2068e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0498e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7529e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9085e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7022e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8346e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1556e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4432e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1209e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2474e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0858e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5266e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3366e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5041e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2339e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9492e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0452e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9384e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8730e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3492e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7333e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3889e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9554e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5220e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1476e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2317e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3909e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5116e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7249e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6039e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3946e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3311e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4715e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3770e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8174e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8491e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8417e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3715e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7668e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6624e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2916e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5768e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5591e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5231e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5878e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7898e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4854e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3004e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1403e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0708e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7940e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3293e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7198e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0832e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6233e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8249e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0136e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6951e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2776e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2838e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8975e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4714e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3673e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8860e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3222e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5439e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4518e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1207e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6807e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9628e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4127e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3913e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7205e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8260e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5063e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5313e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1538e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2406e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2046e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3311e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2227e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5328e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1562e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2030e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1134e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2039e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4997e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3673e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5147e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0074e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8849e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7028e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7794e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7556e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9587e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9015e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4935e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1781e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1103e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4077e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7812e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2425e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7024e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1379e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9129e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9019e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1686e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4022e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9015e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6807e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1394e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4103e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2006e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1569e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1331e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9225e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3085e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 24---------------
Evaluating
				 {'precision': {'supports': 0.8744444444444445, 'contradicts': 0.6444444444444445, 'parts_of_same': 0.8008849557522124}, 'recall': {'supports': 0.9258823529411765, 'contradicts': 0.5, 'parts_of_same': 0.724}, 'f1': {'supports': 0.8994285714285715, 'contradicts': 0.5631067961165049, 'parts_of_same': 0.7605042016806722}, 'support': {'supports': 850, 'contradicts': 116, 'parts_of_same': 250}, 'micro_avg': {'precision': 0.84375, 'recall': 0.84375, 'f1': 0.84375, 'support': None}, 'macro_avg': {'precision': 0.7732579482137005, 'recall': 0.7166274509803922, 'f1': 0.7410131897419162, 'support': None}, 'weighted_avg': {'precision': 0.8373804048284428, 'recall': 0.84375, 'f1': 0.8387834905295793, 'support': None}}
Loss: tensor(2.4832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4392e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9282e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9554e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9693e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1668e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6697e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5209e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6421e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9015e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2205e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4180e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4180e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4258e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8922e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3472e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4896e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8653e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8125e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9827e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0551e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3920e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8015e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3759e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5728e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4180e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6697e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3434e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8869e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2293e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2161e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4035e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0728e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9304e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8368e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7050e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1297e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0459e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9927e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1931e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4922e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0832e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3854e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6278e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1353e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5213e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7969e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2408e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8039e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1282e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2317e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8595e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7909e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5129e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1556e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4136e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1503e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1013e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6207e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8037e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4313e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0390e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2430e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9443e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2549e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4995e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4236e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6147e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8761e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1328e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6467e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3410e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0935e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7352e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2432e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4715e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6476e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8942e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5525e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9554e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5516e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7293e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3264e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4666e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5390e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9558e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2077e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3876e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6750e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0101e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8688e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2944e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1509e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6885e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5390e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8342e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7973e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1224e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3889e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5737e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9571e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6847e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7478e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2529e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5604e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6328e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4953e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9392e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2043e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4043e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5719e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4156e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3902e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8143e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4598e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7931e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4317e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4896e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2019e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1690e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6951e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0845e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8439e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5982e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3050e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8231e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7406e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2598e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9436e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6975e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3547e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3962e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2476e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0904e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1432e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2916e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5845e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1441e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8165e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8355e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7668e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6858e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1984e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8549e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7072e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8935e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7516e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3794e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0832e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6066e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4046e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0311e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2233e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3681e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7946e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2406e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4960e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7313e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2642e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1375e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2730e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9916e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 25---------------
Evaluating
				 {'precision': {'supports': 0.8744444444444445, 'contradicts': 0.6444444444444445, 'parts_of_same': 0.8008849557522124}, 'recall': {'supports': 0.9258823529411765, 'contradicts': 0.5, 'parts_of_same': 0.724}, 'f1': {'supports': 0.8994285714285715, 'contradicts': 0.5631067961165049, 'parts_of_same': 0.7605042016806722}, 'support': {'supports': 850, 'contradicts': 116, 'parts_of_same': 250}, 'micro_avg': {'precision': 0.84375, 'recall': 0.84375, 'f1': 0.84375, 'support': None}, 'macro_avg': {'precision': 0.7732579482137005, 'recall': 0.7166274509803922, 'f1': 0.7410131897419162, 'support': None}, 'weighted_avg': {'precision': 0.8373804048284428, 'recall': 0.84375, 'f1': 0.8387834905295793, 'support': None}}
Loss: tensor(3.4089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4432e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4794e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8467e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3909e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2949e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4586e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5163e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6249e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7132e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2165e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5141e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2134e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9984e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4916e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5048e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4792e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3728e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6163e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7125e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0688e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9145e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3185e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2205e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6289e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6591e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8911e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4224e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3430e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1556e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3741e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3264e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7315e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6046e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6677e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0491e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3375e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0990e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4388e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5529e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8538e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2595e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4832e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3955e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5922e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3507e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2317e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5785e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3997e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6295e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2902e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1690e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8171e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3809e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9459e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9565e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9191e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8392e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4644e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6163e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4143e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8492e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2114e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9759e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2595e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4410e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5953e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4253e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1375e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4573e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7697e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3273e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5765e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1715e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6052e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1432e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6384e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8816e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5375e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5077e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9430e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8271e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4854e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6957e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9666e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3569e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3887e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5697e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6489e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8099e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4251e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2233e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6838e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0459e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5946e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1863e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9940e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6026e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5061e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5677e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0999e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3624e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4295e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8154e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1644e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7260e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9257e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5218e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2165e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9633e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6904e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5302e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2225e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1207e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1540e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4017e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7101e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6205e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0931e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4353e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4518e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5865e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9397e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9035e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1350e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3313e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5690e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8895e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8648e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7697e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4891e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9317e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3251e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9675e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5161e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8516e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1547e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9591e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6171e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1942e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1776e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9774e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8154e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7028e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6816e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5331e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1984e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4203e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1887e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5185e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5410e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2688e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5423e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3772e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6203e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6582e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2105e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9055e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4653e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3185e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3017e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9057e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2333e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9035e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4172e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1765e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3487e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9000e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0637e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7946e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5229e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3909e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0591e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3320e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8783e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5436e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4997e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0776e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6055e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0507e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0920e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4858e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8988e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0028e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3946e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0602e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0818e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7990e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5242e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3072e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4701e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7328e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 26---------------
Evaluating
				 {'precision': {'supports': 0.8744444444444445, 'contradicts': 0.6444444444444445, 'parts_of_same': 0.8008849557522124}, 'recall': {'supports': 0.9258823529411765, 'contradicts': 0.5, 'parts_of_same': 0.724}, 'f1': {'supports': 0.8994285714285715, 'contradicts': 0.5631067961165049, 'parts_of_same': 0.7605042016806722}, 'support': {'supports': 850, 'contradicts': 116, 'parts_of_same': 250}, 'micro_avg': {'precision': 0.84375, 'recall': 0.84375, 'f1': 0.84375, 'support': None}, 'macro_avg': {'precision': 0.7732579482137005, 'recall': 0.7166274509803922, 'f1': 0.7410131897419162, 'support': None}, 'weighted_avg': {'precision': 0.8373804048284428, 'recall': 0.84375, 'f1': 0.8387834905295793, 'support': None}}
Loss: tensor(2.0242e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9101e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9384e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6505e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8425e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5772e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4172e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5489e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0851e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7222e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9653e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9132e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9969e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4324e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1562e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7516e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6858e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6779e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3737e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0370e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2735e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8849e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7039e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6858e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7531e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3419e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6582e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8006e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3562e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7447e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8598e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4573e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5077e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9030e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2695e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2112e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7430e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9244e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6591e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5704e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3887e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5041e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4136e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3896e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7406e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6565e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6860e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6134e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0278e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5664e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4258e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4180e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4030e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2233e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8854e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1768e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8626e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3940e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2586e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9410e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8635e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0657e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4940e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1167e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3238e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5196e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1013e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6037e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9902e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4642e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1805e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5278e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7019e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1863e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8039e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1085e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9554e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2957e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1348e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2982e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8331e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8730e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3809e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6476e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2443e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2587e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2776e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0821e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2233e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9443e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7322e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2869e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2098e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5041e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0061e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0818e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6904e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7313e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2642e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2470e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3257e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8331e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3419e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8006e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4891e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1384e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8352e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7924e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4043e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4417e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3154e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2969e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9189e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4821e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7419e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2092e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9721e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0015e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3094e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8591e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0242e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0233e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4251e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7920e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6308e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0257e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2434e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9257e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8474e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0094e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9950e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8807e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2434e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3794e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4593e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2439e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1207e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6657e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5518e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1147e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1794e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8050e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8284e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0918e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6127e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7697e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7190e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9589e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7262e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2112e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1847e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6900e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9154e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8512e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2664e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1863e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7668e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4642e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6172e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9266e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0262e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4589e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9000e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5704e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2900e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5878e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4123e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5342e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9339e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9984e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1622e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1531e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2587e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6951e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1348e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4721e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7066e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1509e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5231e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4759e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1907e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1726e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3924e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5222e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5278e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4485e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5516e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2171e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5562e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5390e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5161e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3673e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7425e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4670e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0951e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1518e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3821e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8533e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0423e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3699e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2006e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1624e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5209e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3158e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4030e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8346e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7066e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3070e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5966e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4851e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0805e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6591e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2540e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5805e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1273e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8127e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3796e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2233e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5818e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6766e-06, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 27---------------
Evaluating
				 {'precision': {'supports': 0.8744444444444445, 'contradicts': 0.6444444444444445, 'parts_of_same': 0.8008849557522124}, 'recall': {'supports': 0.9258823529411765, 'contradicts': 0.5, 'parts_of_same': 0.724}, 'f1': {'supports': 0.8994285714285715, 'contradicts': 0.5631067961165049, 'parts_of_same': 0.7605042016806722}, 'support': {'supports': 850, 'contradicts': 116, 'parts_of_same': 250}, 'micro_avg': {'precision': 0.84375, 'recall': 0.84375, 'f1': 0.84375, 'support': None}, 'macro_avg': {'precision': 0.7732579482137005, 'recall': 0.7166274509803922, 'f1': 0.7410131897419162, 'support': None}, 'weighted_avg': {'precision': 0.8373804048284428, 'recall': 0.84375, 'f1': 0.8387834905295793, 'support': None}}
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5289e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1041e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9322e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6531e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5308e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0805e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0496e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8911e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3893e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9759e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3600e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4648e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6207e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5209e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8454e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0262e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9046e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8379e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3887e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5227e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9189e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2346e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9203e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5931e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1050e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3459e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8171e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1384e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7322e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9856e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4068e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7249e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2525e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3911e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5708e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4041e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6222e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6792e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5258e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3600e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3130e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7006e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0556e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7867e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5984e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9203e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2796e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5019e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6887e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2540e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2092e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5664e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2178e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0430e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5410e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2977e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3474e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1207e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0920e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0774e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3231e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6295e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1761e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2434e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0443e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2598e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8816e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0278e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4180e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5547e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0730e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2876e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5503e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6946e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6668e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5262e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2233e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3525e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5048e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8816e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4247e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1284e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4213e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3975e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3781e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4143e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3869e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1388e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8648e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8487e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4801e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3125e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8589e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2730e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1282e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2098e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3781e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6329e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4858e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7640e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1375e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5623e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1982e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1990e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3331e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8394e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0569e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4224e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5227e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5858e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8152e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7249e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4335e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2709e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6591e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7006e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2077e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9017e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3278e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8765e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9551e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6039e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5308e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6329e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5196e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5851e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8832e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1099e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8817e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4388e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8476e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5200e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8492e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6602e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8895e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3399e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9397e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3138e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0346e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7361e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0209e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3701e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3624e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6145e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7880e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3887e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4759e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8904e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0394e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2856e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9000e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6876e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6995e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8176e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5342e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0324e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9397e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0108e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9132e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1171e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0624e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7425e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4026e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2019e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6203e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2055e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0907e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8668e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2434e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3615e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0955e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8662e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8218e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9637e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5953e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3271e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3238e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1631e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9551e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6037e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3538e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1644e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9783e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0445e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6295e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9088e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3735e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2693e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2686e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1260e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9503e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8139e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2688e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7805e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6366e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5955e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3962e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7719e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9132e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4041e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2860e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2233e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0990e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8465e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3697e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2476e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2792e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5525e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5719e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1891e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1352e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2108e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8646e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4384e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4055e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3697e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5483e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6496e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1026e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3476e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6946e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4688e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7328e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5154e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4754e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3668e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7962e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3832e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0935e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6439e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3238e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7470e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3547e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6070e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7809e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0805e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7582e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8478e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7668e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9904e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3975e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3849e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5048e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4492e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5623e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8206e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7832e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9531e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2982e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1264e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3924e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7935e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9372e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1635e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7066e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4143e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7809e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0818e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2295e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0288e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0693e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5147e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0476e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5161e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8776e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9893e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7832e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5196e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5623e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5209e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1887e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8136e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5380e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1454e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3735e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3651e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7046e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9441e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8721e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9878e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8655e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6205e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5688e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0262e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5721e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2002e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5229e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1809e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7922e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8158e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1693e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1421e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2709e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2856e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3403e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6876e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4244e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0693e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7145e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8664e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2028e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4851e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3570e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2434e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5823e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9030e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3472e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 28---------------
Evaluating
				 {'precision': {'supports': 0.8744444444444445, 'contradicts': 0.6444444444444445, 'parts_of_same': 0.8008849557522124}, 'recall': {'supports': 0.9258823529411765, 'contradicts': 0.5, 'parts_of_same': 0.724}, 'f1': {'supports': 0.8994285714285715, 'contradicts': 0.5631067961165049, 'parts_of_same': 0.7605042016806722}, 'support': {'supports': 850, 'contradicts': 116, 'parts_of_same': 250}, 'micro_avg': {'precision': 0.84375, 'recall': 0.84375, 'f1': 0.84375, 'support': None}, 'macro_avg': {'precision': 0.7732579482137005, 'recall': 0.7166274509803922, 'f1': 0.7410131897419162, 'support': None}, 'weighted_avg': {'precision': 0.8373804048284428, 'recall': 0.84375, 'f1': 0.8387834905295793, 'support': None}}
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1324e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2333e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1891e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9916e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8854e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8895e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6542e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8156e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7108e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4467e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1891e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9556e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2944e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3593e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2695e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1760e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4960e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5503e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5342e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1352e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2145e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9169e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9101e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4247e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8512e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7754e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8580e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2145e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6602e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7266e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4231e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6049e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6657e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2072e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8139e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8139e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0869e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7108e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5209e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4353e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5719e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3725e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3719e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5284e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8602e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1171e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4247e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9916e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3821e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6236e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3047e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4737e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3238e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3520e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2527e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9055e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4068e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1666e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9827e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7443e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9178e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1167e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5161e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7006e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8478e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5289e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3070e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3962e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1534e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1955e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1655e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6688e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3290e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0882e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4030e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9172e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3743e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4324e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0465e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6569e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0545e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1008e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9410e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7969e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4063e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9503e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3432e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9500e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4688e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0990e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9712e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0255e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5331e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5380e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8686e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1893e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2935e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6465e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0637e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0580e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8352e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4335e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3264e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5887e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6525e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6533e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9880e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4640e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4180e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9008e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0556e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2072e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0447e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5127e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7556e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4792e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3339e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0882e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1167e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0918e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5284e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1053e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4145e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2437e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2525e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4059e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6185e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7297e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9940e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4059e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9977e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3386e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6384e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4573e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5317e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4134e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7190e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6357e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4737e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3920e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5380e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1348e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5823e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4063e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1088e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7266e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3908e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5161e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9582e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8478e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2257e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3862e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1328e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9578e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8817e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1576e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4518e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9419e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2392e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3882e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6723e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7108e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7345e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5380e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3996e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1264e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4955e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7328e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2944e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0121e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5024e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3996e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8194e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3898e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7094e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7322e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2434e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3668e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2465e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0085e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4765e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1421e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4348e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7010e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3290e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9766e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4586e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0121e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9646e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4074e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7094e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2341e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2434e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7878e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0556e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8761e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3478e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8701e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8161e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5070e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6396e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0194e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2257e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9427e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8695e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4823e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4266e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0999e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0655e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3973e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3047e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2429e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2459e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5781e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9712e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8169e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7503e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2721e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2311e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7085e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4754e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2253e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8465e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4728e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7529e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7433e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6348e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0809e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9754e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4063e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0965e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1273e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4512e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5004e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9950e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9339e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5999e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3419e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8973e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5772e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4918e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4586e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7403e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6152e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1686e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0593e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9000e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6973e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3962e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1419e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6077e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2876e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4247e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1035e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0200e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6167e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2902e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0450e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4244e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2165e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7617e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6572e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2775e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0922e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5785e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5534e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1461e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0966e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6329e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7278e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6145e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1216e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3273e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2186e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3154e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2527e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3047e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9950e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0911e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6108e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8375e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0512e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9931e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1218e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9000e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4167e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6049e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3908e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7006e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1320e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3988e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2346e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9379e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2863e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1714e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0805e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3055e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1167e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3681e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6329e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8302e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0094e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6863e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8655e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4821e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6163e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5623e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1237e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2863e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0556e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6774e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3878e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0918e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2121e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2072e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9000e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3668e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0288e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4927e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6851e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2695e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8203e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0104e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3478e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0293e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0887e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5489e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7236e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1723e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3116e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7397e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3750e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1576e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6339e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0715e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1803e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6052e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1099e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5289e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5470e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4244e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9699e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1631e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6673e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9008e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3832e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2558e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7587e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2549e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3580e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6673e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2447e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6329e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6224e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7242e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8320e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1533e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9397e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8286e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2525e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9580e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9531e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6145e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8103e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1760e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8657e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3759e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4203e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4565e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1167e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 29---------------
Evaluating
				 {'precision': {'supports': 0.8734739178690344, 'contradicts': 0.6404494382022472, 'parts_of_same': 0.8008849557522124}, 'recall': {'supports': 0.9258823529411765, 'contradicts': 0.49137931034482757, 'parts_of_same': 0.724}, 'f1': {'supports': 0.8989149057681325, 'contradicts': 0.5560975609756097, 'parts_of_same': 0.7605042016806722}, 'support': {'supports': 850, 'contradicts': 116, 'parts_of_same': 250}, 'micro_avg': {'precision': 0.8429276315789473, 'recall': 0.8429276315789473, 'f1': 0.8429276315789473, 'support': None}, 'macro_avg': {'precision': 0.7716027706078313, 'recall': 0.7137538877620013, 'f1': 0.7385055561414715, 'support': None}, 'weighted_avg': {'precision': 0.8363208914129877, 'recall': 0.8429276315789473, 'f1': 0.8377557873324436, 'support': None}}
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0050e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8483e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8556e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2044e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6882e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4035e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7624e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2145e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8399e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0509e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9878e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5953e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8547e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9189e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9000e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7397e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4239e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9388e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0158e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5719e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8478e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8827e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2167e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0957e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9766e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2695e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9167e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5529e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4664e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5628e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4127e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0436e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7823e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4699e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1454e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2186e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7249e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3812e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6145e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1392e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8726e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3908e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9578e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5878e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2015e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5284e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9008e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9427e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2812e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4255e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9339e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0878e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3297e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1534e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4637e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0443e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8382e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9225e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0474e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0094e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1441e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4792e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3570e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0646e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6668e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9207e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0536e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6361e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0192e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9406e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7507e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3908e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6145e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4573e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0052e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5693e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1053e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6049e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6331e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8206e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7225e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9339e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1237e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0821e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0467e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1635e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5380e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9350e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4946e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8593e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1216e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7865e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1955e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4642e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8203e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2525e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3474e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4674e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1907e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3290e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1571e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5229e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4063e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9441e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6396e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8904e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8863e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5885e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8121e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7094e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8139e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4121e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1053e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3668e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1304e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3578e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9379e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9041e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2977e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4858e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5308e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6348e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9766e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4858e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7190e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1812e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2525e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3701e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3629e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3726e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2430e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0531e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6388e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2582e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1891e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7249e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0772e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7966e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6361e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6484e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8817e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6582e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1812e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0655e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6496e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1399e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9684e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5535e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1505e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1053e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9154e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4282e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2944e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8103e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3812e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5176e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8876e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3916e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6366e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7345e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1858e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9198e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8294e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5535e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8382e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5284e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9198e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6655e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1237e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1315e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2341e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3849e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6068e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2447e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1141e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9427e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4465e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6308e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0531e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6668e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5310e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2130e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2845e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9200e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0257e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0962e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7253e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2997e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0061e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3125e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1189e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2973e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1529e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1531e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5503e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2679e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2057e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0627e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5512e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5961e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5681e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0311e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2041e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0262e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7955e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8103e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3172e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0130e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5348e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2002e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1906e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3026e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5999e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4239e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1794e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6163e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3570e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7642e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8394e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6396e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0805e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2775e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0096e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8139e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3039e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3686e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0293e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8817e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2962e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3474e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7236e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8580e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7236e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5807e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9589e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0194e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1891e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7628e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7697e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7529e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1760e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2763e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8103e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9569e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5999e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9494e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4143e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4586e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8697e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4975e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9624e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6342e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8904e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7949e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5957e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7529e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4063e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1035e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7236e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0192e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6484e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2434e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6315e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2898e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8662e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1231e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8904e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8432e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3474e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9472e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1461e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2238e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8997e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8169e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4335e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8946e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9370e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3657e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3570e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7935e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8465e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5942e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5957e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2165e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4247e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5233e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7190e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0121e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4593e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5275e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4783e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5961e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6049e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8794e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7190e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2708e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3432e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5070e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3721e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6792e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1760e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5161e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5196e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3047e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4278e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4213e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0920e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1768e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5975e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1412e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7684e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2437e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8294e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9189e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7433e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8646e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4762e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3487e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1723e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4247e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6484e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8311e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3231e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0619e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8284e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2002e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2333e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6854e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2410e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2437e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8845e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4335e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4239e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5719e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4295e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2439e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5961e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5961e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2401e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8478e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0624e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3047e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2098e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4505e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0624e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4946e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4703e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7345e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5414e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9147e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6329e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2186e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4467e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5284e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4141e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3615e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5233e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3693e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0262e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8728e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9132e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2002e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4384e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1355e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6049e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4180e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2437e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4229e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1092e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4924e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8310e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8139e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4578e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6904e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4258e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1161e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2775e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4257e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0257e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3180e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5776e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3057e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5595e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4858e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6852e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3812e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0627e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1315e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3578e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5070e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9427e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7771e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5776e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5154e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6500e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0918e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9331e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8382e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1099e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4180e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1677e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6500e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9853e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9805e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9059e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8139e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3290e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5719e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7529e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0242e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1266e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9950e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4772e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8206e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0192e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7433e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9331e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6673e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2582e-06, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 30---------------
Evaluating
				 {'precision': {'supports': 0.8734739178690344, 'contradicts': 0.6404494382022472, 'parts_of_same': 0.8008849557522124}, 'recall': {'supports': 0.9258823529411765, 'contradicts': 0.49137931034482757, 'parts_of_same': 0.724}, 'f1': {'supports': 0.8989149057681325, 'contradicts': 0.5560975609756097, 'parts_of_same': 0.7605042016806722}, 'support': {'supports': 850, 'contradicts': 116, 'parts_of_same': 250}, 'micro_avg': {'precision': 0.8429276315789473, 'recall': 0.8429276315789473, 'f1': 0.8429276315789473, 'support': None}, 'macro_avg': {'precision': 0.7716027706078313, 'recall': 0.7137538877620013, 'f1': 0.7385055561414715, 'support': None}, 'weighted_avg': {'precision': 0.8363208914129877, 'recall': 0.8429276315789473, 'f1': 0.8377557873324436, 'support': None}}
Loss: tensor(8.9950e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0962e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5439e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8895e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4165e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8382e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5012e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7935e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8139e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0015e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4762e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9670e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1348e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2525e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5289e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4785e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0443e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5623e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8161e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9427e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2333e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3622e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8503e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6319e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4586e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1324e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5410e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5794e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8454e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1141e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8918e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8213e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1760e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7333e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4703e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5052e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0008e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9485e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9670e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1392e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3812e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0013e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3803e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1421e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1906e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5161e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6203e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8271e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3812e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0376e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8491e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6518e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0242e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8206e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3812e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1421e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7617e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1818e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2754e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8960e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8357e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5845e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0288e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8302e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3474e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1141e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2554e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0443e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0715e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3812e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6049e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5012e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8827e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8566e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8997e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0192e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4180e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3412e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5233e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0624e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6231e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9297e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7832e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6723e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5041e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2355e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4346e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9088e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8580e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2238e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2951e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3050e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3794e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2876e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8328e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9103e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6492e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3125e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5052e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4346e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8454e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0965e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0288e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2269e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5196e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7706e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6852e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2098e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3047e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2775e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3262e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5999e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3057e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2735e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2002e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2068e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2229e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1053e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4247e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8904e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0376e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3854e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8911e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5604e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8662e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7337e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0096e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4239e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3726e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1392e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4419e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9147e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0918e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7216e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7328e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3908e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1803e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3821e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4703e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9670e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0035e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6049e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9582e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6572e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2437e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7593e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2253e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1765e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0008e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5048e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5423e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1730e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7867e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2721e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5805e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1677e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1172e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1760e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3854e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8121e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7617e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6273e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6249e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2152e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9000e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6862e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4586e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2392e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3821e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5284e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6236e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1664e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0818e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7521e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6229e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5100e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5512e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1664e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6145e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2767e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2951e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3478e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6812e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1324e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4151e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4762e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4236e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5012e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6329e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4762e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3176e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9008e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2863e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4578e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8139e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3297e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8721e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2229e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2944e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3658e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3478e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7433e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1461e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7859e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2860e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1269e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8827e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4180e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2709e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3896e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9712e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0715e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1832e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1906e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0619e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7859e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6681e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1765e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9035e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2152e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9920e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3570e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1914e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3996e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5807e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0715e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2253e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8382e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0600e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3640e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4143e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9950e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8294e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7809e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2695e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4889e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9339e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5284e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3725e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1141e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1099e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8520e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2935e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4346e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4545e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3849e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7249e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4239e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9670e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8103e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3916e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5100e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8807e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6891e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0096e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2186e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0096e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3908e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9509e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1796e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2754e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6571e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3640e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8294e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1505e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5957e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5623e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4357e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7763e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5161e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7345e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7433e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7776e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6319e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4762e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9427e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7946e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8637e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1143e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7094e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2229e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5284e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6822e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0965e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8628e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3273e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7521e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5070e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5196e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5975e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1134e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8294e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4180e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0604e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1269e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4686e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3474e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0008e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4151e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7617e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6852e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9957e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3812e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2916e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6388e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3658e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4858e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1730e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7617e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1141e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4762e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1461e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0531e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1200e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9243e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4156e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5026e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4527e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0104e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4916e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2977e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9379e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6310e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5284e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3812e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7973e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6366e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0278e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6211e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1143e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8024e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5767e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4335e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2876e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4176e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9551e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0556e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0192e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9551e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9000e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2320e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1053e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8626e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6491e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2429e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2209e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3450e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6701e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9957e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4759e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3896e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9147e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4770e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2863e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3640e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2754e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6129e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4335e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7224e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7433e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0194e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2255e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4519e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8721e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8017e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8382e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4247e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3908e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3629e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3202e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1760e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0192e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3996e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5957e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5807e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7190e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2152e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5527e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4527e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9540e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6931e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0194e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3231e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0556e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3205e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2962e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6878e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8382e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6390e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7266e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0061e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7741e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9916e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8286e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0706e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5818e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8445e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6145e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0619e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4699e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1072e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5284e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7190e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7521e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6049e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3251e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8646e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3013e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8043e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2341e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3158e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0104e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5794e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2709e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3803e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1651e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4487e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0361e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2072e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4674e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1099e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8264e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7859e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1392e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9507e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5043e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6572e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8110e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4403e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8382e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4703e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5233e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0194e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4180e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0556e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0927e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1730e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2863e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6057e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1010e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0715e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4519e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4862e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2098e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3716e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0376e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4686e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7392e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0192e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2595e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5535e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4924e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2152e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2916e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1664e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4762e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3658e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8817e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9551e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4762e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2916e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6147e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6388e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9580e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4239e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2429e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2709e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4762e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6212e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3079e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0821e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9155e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4762e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7161e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9853e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3716e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2152e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9070e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9331e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1551e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6869e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3459e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4518e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2002e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3135e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5242e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3658e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7949e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7771e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0008e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4880e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0962e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9950e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9161e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4489e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Train size: 50 Test size: 50
	Tokenizer: ../home/arg_mining/4epoch_complete/tokenizer Model: ../home/arg_mining/4epoch_complete/model/


		-------------RUN 1-----------
			------------EPOCH 1---------------
Evaluating
				 {'precision': {'supports': 0.7014218009478673, 'contradicts': 0.1700404858299595, 'parts_of_same': 0.14695945945945946}, 'recall': {'supports': 0.06896551724137931, 'contradicts': 0.16153846153846155, 'parts_of_same': 0.8285714285714286}, 'f1': {'supports': 0.12558336868901143, 'contradicts': 0.16568047337278105, 'parts_of_same': 0.2496413199426112}, 'support': {'supports': 2146, 'contradicts': 260, 'parts_of_same': 420}, 'micro_avg': {'precision': 0.19037508846426043, 'recall': 0.19037508846426043, 'f1': 0.19037508846426043, 'support': None}, 'macro_avg': {'precision': 0.3394739154124287, 'recall': 0.35302513578375655, 'f1': 0.18030172066813455, 'support': None}, 'weighted_avg': {'precision': 0.5701290460448993, 'recall': 0.19037508846426043, 'f1': 0.14770990327651745, 'support': None}}
Loss: tensor(0.4166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3660, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2946, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9910, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9878, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7874, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3837, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8891, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3784, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8741, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8819, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9833, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5800, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4676, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4771, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6886, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9862, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3863, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1758, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3949, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4972, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3887, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2991, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6928, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3883, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2784, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2909, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1782, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2972, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0834, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0991, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3953, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2906, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1975, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7924, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7866, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1985, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5953, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4968, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3958, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5993, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1888, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3716, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3747, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6919, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3853, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2918, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3863, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2862, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2877, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3998, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5937, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6881, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2930, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3925, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4910, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2862, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3918, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2853, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1913, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0994, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1971, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6849, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9881, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2800, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2956, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4575, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4660, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4742, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4953, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3948, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1955, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6690, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4794, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7638, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3912, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2896, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5931, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6917, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0980, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9934, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2939, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3944, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2942, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1837, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3988, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4879, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3913, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3796, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1737, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9999, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5959, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0857, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4936, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8787, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3928, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3885, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4863, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5917, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6955, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7637, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3806, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1835, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0946, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8741, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3916, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1767, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1733, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2953, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2879, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2931, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3896, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2940, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3818, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3879, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2953, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1736, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2979, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2758, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5941, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4924, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1919, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3910, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6878, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4903, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1898, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1956, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9720, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0989, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8848, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1818, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0879, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0870, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0936, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3877, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3789, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4904, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5690, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8999, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3934, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3818, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2979, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6946, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8925, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8913, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3896, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1874, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3764, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2947, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2943, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2817, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0878, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0817, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3963, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1818, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1945, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0821, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0690, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3730, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2767, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4793, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2817, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8911, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3742, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1834, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3767, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3998, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2805, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6935, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3927, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3989, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0796, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3886, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4992, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1928, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2924, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0926, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2924, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1747, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6806, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4962, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7972, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3953, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0953, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1998, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1930, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8835, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0939, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0965, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2772, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4806, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1949, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1767, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1994, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0837, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2892, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0969, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0772, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3948, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9956, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1988, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1874, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1835, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1637, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7945, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7951, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1898, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1937, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3976, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0927, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6976, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4942, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4863, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9867, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3835, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1976, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5849, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2637, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2885, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2934, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5126, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 2---------------
Evaluating
				 {'precision': {'supports': 0.9550561797752809, 'contradicts': 0.44226044226044225, 'parts_of_same': 0.5151098901098901}, 'recall': {'supports': 0.7525629077353215, 'contradicts': 0.6923076923076923, 'parts_of_same': 0.8928571428571429}, 'f1': {'supports': 0.8418034923117018, 'contradicts': 0.5397301349325336, 'parts_of_same': 0.6533101045296168}, 'support': {'supports': 2146, 'contradicts': 260, 'parts_of_same': 420}, 'micro_avg': {'precision': 0.7678697806086341, 'recall': 0.7678697806086341, 'f1': 0.7678697806086341, 'support': None}, 'macro_avg': {'precision': 0.6374755040485377, 'recall': 0.7792425809667188, 'f1': 0.6782812439246174, 'support': None}, 'weighted_avg': {'precision': 0.842492721384155, 'recall': 0.7678697806086341, 'f1': 0.7859980090183332, 'support': None}}
Loss: tensor(0.1662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0784, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0996, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1870, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0747, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1660, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8993, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0820, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4737, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1693, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1886, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4866, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2881, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0936, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3958, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0787, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0853, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0963, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0969, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1821, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1910, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1693, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0679, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6987, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1999, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1976, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0952, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1852, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0918, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4801, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5833, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0789, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0777, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4933, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0913, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1958, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2752, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0904, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2958, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1747, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1994, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1930, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0980, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0739, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4931, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3911, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1835, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4860, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4638, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0953, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1784, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7960, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0939, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5921, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3953, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0930, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2867, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0805, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7764, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0881, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0676, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6833, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0747, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8881, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5730, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4835, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1784, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9676, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0975, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1925, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0936, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3860, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0935, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1846, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1952, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1927, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0885, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1771, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1638, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0796, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0739, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8906, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0874, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1772, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0926, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0834, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2975, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0801, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2730, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3945, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0949, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2920, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1928, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0736, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6815, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3819, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0741, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0716, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0961, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1900, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0979, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0830, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0990, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1987, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5943, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1912, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0866, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0860, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1995, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4820, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1931, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0915, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1989, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0762, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0834, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1890, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7800, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1687, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1830, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0873, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1967, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4575, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1952, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9944, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1955, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3963, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3848, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2720, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0954, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0772, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0965, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0821, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0919, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6733, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0849, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5820, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1969, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6956, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0881, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2820, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0887, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0742, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0752, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0863, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1914, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0794, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0676, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7891, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0875, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0830, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0938, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1820, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0965, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4800, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2913, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0867, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0741, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0891, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5981, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0716, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6837, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0934, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0638, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1736, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0883, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1930, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0913, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2944, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5877, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4963, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1921, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2928, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2990, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4660, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1990, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0958, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0637, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0789, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0824, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2848, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3988, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0736, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3937, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1758, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1857, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1940, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1930, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4819, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4360, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 3---------------
Evaluating
				 {'precision': {'supports': 0.9658952496954933, 'contradicts': 0.38589981447124305, 'parts_of_same': 0.5627906976744186}, 'recall': {'supports': 0.739049394221808, 'contradicts': 0.8, 'parts_of_same': 0.8642857142857143}, 'f1': {'supports': 0.8373812038014783, 'contradicts': 0.5206508135168961, 'parts_of_same': 0.6816901408450704}, 'support': {'supports': 2146, 'contradicts': 260, 'parts_of_same': 420}, 'micro_avg': {'precision': 0.7632696390658175, 'recall': 0.7632696390658175, 'f1': 0.7632696390658175, 'support': None}, 'macro_avg': {'precision': 0.6381952539470517, 'recall': 0.8011117028358408, 'f1': 0.6799073860544816, 'support': None}, 'weighted_avg': {'precision': 0.8526246463667047, 'recall': 0.7632696390658175, 'f1': 0.7851023121115694, 'support': None}}
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0852, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0976, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0751, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0777, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1961, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0867, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1730, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0747, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0928, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0958, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0839, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0764, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0973, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0687, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4772, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0946, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0993, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0742, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1949, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1817, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0772, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0916, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0980, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0886, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3926, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2764, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0930, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1961, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2997, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1730, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0962, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6996, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1730, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5953, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4917, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3817, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4793, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1730, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1733, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9980, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0960, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2852, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0794, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2921, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2946, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1787, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1942, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9958, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0887, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1834, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0927, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3998, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1909, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1975, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0908, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0943, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2963, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2898, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0935, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0739, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0716, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3952, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0947, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0952, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1886, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1815, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1737, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4793, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0886, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2911, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4968, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1730, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0808, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1909, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1910, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3796, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1834, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0875, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0575, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0536, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 4---------------
Evaluating
				 {'precision': {'supports': 0.9251390996459282, 'contradicts': 0.484149855907781, 'parts_of_same': 0.6434262948207171}, 'recall': {'supports': 0.8522833178005592, 'contradicts': 0.6461538461538462, 'parts_of_same': 0.7690476190476191}, 'f1': {'supports': 0.887218045112782, 'contradicts': 0.5535420098846788, 'parts_of_same': 0.7006507592190889}, 'support': {'supports': 2146, 'contradicts': 260, 'parts_of_same': 420}, 'micro_avg': {'precision': 0.8209483368719037, 'recall': 0.8209483368719037, 'f1': 0.8209483368719037, 'support': None}, 'macro_avg': {'precision': 0.6842384167914753, 'recall': 0.7558282610006749, 'f1': 0.71380360473885, 'support': None}, 'weighted_avg': {'precision': 0.8426986957540291, 'recall': 0.8209483368719037, 'f1': 0.8287912831755359, 'support': None}}
Loss: tensor(0.1287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1998, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8801, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0952, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6716, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0911, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0892, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0687, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0961, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9982, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6953, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0787, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1693, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0817, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0793, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2940, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1878, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2917, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0939, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3687, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0860, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3676, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2806, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0863, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7948, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0926, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1879, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1739, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0739, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0853, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0784, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0933, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3937, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2751, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6975, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7883, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6990, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0888, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0940, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2975, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1962, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6904, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0824, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1919, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2720, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2758, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1988, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1968, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4771, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0873, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0751, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0989, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0758, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 5---------------
Evaluating
				 {'precision': {'supports': 0.941544885177453, 'contradicts': 0.505586592178771, 'parts_of_same': 0.6268115942028986}, 'recall': {'supports': 0.8406337371854613, 'contradicts': 0.6961538461538461, 'parts_of_same': 0.8238095238095238}, 'f1': {'supports': 0.8882323978335795, 'contradicts': 0.5857605177993528, 'parts_of_same': 0.7119341563786008}, 'support': {'supports': 2146, 'contradicts': 260, 'parts_of_same': 420}, 'micro_avg': {'precision': 0.8248407643312102, 'recall': 0.8248407643312102, 'f1': 0.8248407643312102, 'support': None}, 'macro_avg': {'precision': 0.6913143571863741, 'recall': 0.7868657023829438, 'f1': 0.7286423573371777, 'support': None}, 'weighted_avg': {'precision': 0.8546598397461119, 'recall': 0.8248407643312102, 'f1': 0.8342026914570791, 'support': None}}
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5949, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0986, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1891, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7982, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1906, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2752, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0857, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0958, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1840, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0953, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8980, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0782, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0676, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0999, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6737, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2976, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0863, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2815, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3915, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0796, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5926, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0955, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0794, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0963, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3877, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4848, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3736, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0931, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2739, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3941, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0805, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8923, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0801, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1660, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3690, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4889, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1936, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 6---------------
Evaluating
				 {'precision': {'supports': 0.9373381667529778, 'contradicts': 0.5940959409594095, 'parts_of_same': 0.5705128205128205}, 'recall': {'supports': 0.8434296365330848, 'contradicts': 0.6192307692307693, 'parts_of_same': 0.8476190476190476}, 'f1': {'supports': 0.8879077753249939, 'contradicts': 0.6064030131826742, 'parts_of_same': 0.6819923371647509}, 'support': {'supports': 2146, 'contradicts': 260, 'parts_of_same': 420}, 'micro_avg': {'precision': 0.8234253361641897, 'recall': 0.8234253361641897, 'f1': 0.8234253361641897, 'support': None}, 'macro_avg': {'precision': 0.7006489760750693, 'recall': 0.770093151127634, 'f1': 0.7254343752241397, 'support': None}, 'weighted_avg': {'precision': 0.8512413429287762, 'recall': 0.8234253361641897, 'f1': 0.8314053966327415, 'support': None}}
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0917, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0820, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0954, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2930, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0846, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1733, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0921, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0943, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6921, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4933, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1860, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0853, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0849, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0762, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1830, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7793, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0874, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0835, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0935, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0962, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1874, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9909, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0943, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0679, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 7---------------
Evaluating
				 {'precision': {'supports': 0.9090069284064665, 'contradicts': 0.5644599303135889, 'parts_of_same': 0.7566844919786097}, 'recall': {'supports': 0.9170549860205033, 'contradicts': 0.6230769230769231, 'parts_of_same': 0.6738095238095239}, 'f1': {'supports': 0.9130132219902575, 'contradicts': 0.5923217550274222, 'parts_of_same': 0.712846347607053}, 'support': {'supports': 2146, 'contradicts': 260, 'parts_of_same': 420}, 'micro_avg': {'precision': 0.8538570417551309, 'recall': 0.8538570417551309, 'f1': 0.8538570417551309, 'support': None}, 'macro_avg': {'precision': 0.7433837835662217, 'recall': 0.7379804776356501, 'f1': 0.739393774874911, 'support': None}, 'weighted_avg': {'precision': 0.8546694751850057, 'recall': 0.8538570417551309, 'f1': 0.8537599068270292, 'support': None}}
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0758, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5985, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3925, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3730, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7912, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0962, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2739, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1956, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3888, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1938, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2956, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7877, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1948, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0875, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0771, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3944, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0808, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0806, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0834, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1918, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1960, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0637, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0808, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0943, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0737, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 8---------------
Evaluating
				 {'precision': {'supports': 0.9383149448345035, 'contradicts': 0.5617283950617284, 'parts_of_same': 0.6614173228346457}, 'recall': {'supports': 0.8718546132339235, 'contradicts': 0.7, 'parts_of_same': 0.8}, 'f1': {'supports': 0.9038647342995169, 'contradicts': 0.6232876712328768, 'parts_of_same': 0.7241379310344829}, 'support': {'supports': 2146, 'contradicts': 260, 'parts_of_same': 420}, 'micro_avg': {'precision': 0.8453644727530077, 'recall': 0.8453644727530077, 'f1': 0.8453644727530077, 'support': None}, 'macro_avg': {'precision': 0.7204868875769592, 'recall': 0.7906182044113078, 'f1': 0.7504301121889588, 'support': None}, 'weighted_avg': {'precision': 0.8625154033692305, 'recall': 0.8453644727530077, 'f1': 0.8513398603544918, 'support': None}}
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1925, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0912, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3839, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7924, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0963, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1957, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0877, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3693, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0815, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0918, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2969, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0900, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0892, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1953, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0817, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5690, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 9---------------
Evaluating
				 {'precision': {'supports': 0.9456289978678039, 'contradicts': 0.4860759493670886, 'parts_of_same': 0.6162162162162163}, 'recall': {'supports': 0.8266542404473439, 'contradicts': 0.7384615384615385, 'parts_of_same': 0.8142857142857143}, 'f1': {'supports': 0.8821481849825957, 'contradicts': 0.5862595419847328, 'parts_of_same': 0.7015384615384616}, 'support': {'supports': 2146, 'contradicts': 260, 'parts_of_same': 420}, 'micro_avg': {'precision': 0.8167020523708421, 'recall': 0.8167020523708421, 'f1': 0.8167020523708421, 'support': None}, 'macro_avg': {'precision': 0.6826403878170363, 'recall': 0.7931338310648656, 'f1': 0.7233153961685966, 'support': None}, 'weighted_avg': {'precision': 0.8543915028558248, 'recall': 0.8167020523708421, 'f1': 0.8280833827794886, 'support': None}}
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1917, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3976, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3993, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2920, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0835, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 10---------------
Evaluating
				 {'precision': {'supports': 0.9238140872065165, 'contradicts': 0.6521739130434783, 'parts_of_same': 0.6666666666666666}, 'recall': {'supports': 0.8984156570363467, 'contradicts': 0.6346153846153846, 'parts_of_same': 0.7714285714285715}, 'f1': {'supports': 0.910937869123553, 'contradicts': 0.6432748538011696, 'parts_of_same': 0.7152317880794701}, 'support': {'supports': 2146, 'contradicts': 260, 'parts_of_same': 420}, 'micro_avg': {'precision': 0.8552724699221514, 'recall': 0.8552724699221514, 'f1': 0.8552724699221514, 'support': None}, 'macro_avg': {'precision': 0.7475515556388871, 'recall': 0.7681532043601008, 'f1': 0.7564815036680642, 'support': None}, 'weighted_avg': {'precision': 0.8606051834877879, 'recall': 0.8552724699221514, 'f1': 0.857226284543817, 'support': None}}
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1948, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9972, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6881, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0915, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6945, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4806, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0892, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1805, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2933, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1916, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0891, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8875, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0987, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0917, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0914, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5943, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8908, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1720, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0737, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0784, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0693, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 11---------------
Evaluating
				 {'precision': {'supports': 0.9146853146853147, 'contradicts': 0.6136363636363636, 'parts_of_same': 0.7266187050359713}, 'recall': {'supports': 0.9142590866728798, 'contradicts': 0.6230769230769231, 'parts_of_same': 0.7214285714285714}, 'f1': {'supports': 0.9144721510137497, 'contradicts': 0.6183206106870229, 'parts_of_same': 0.7240143369175627}, 'support': {'supports': 2146, 'contradicts': 260, 'parts_of_same': 420}, 'micro_avg': {'precision': 0.8588110403397028, 'recall': 0.8588110403397028, 'f1': 0.8588110403397028, 'support': None}, 'macro_avg': {'precision': 0.7516467944525499, 'recall': 0.7529215270594581, 'f1': 0.7522690328727784, 'support': None}, 'weighted_avg': {'precision': 0.8590375074222392, 'recall': 0.8588110403397028, 'f1': 0.8589195386976324, 'support': None}}
Loss: tensor(5.9350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4965, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1917, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1767, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0848, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0741, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1975, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1962, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1819, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0794, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1772, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0910, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0679, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3660, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1989, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0909, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0936, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0835, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 12---------------
Evaluating
				 {'precision': {'supports': 0.9061473486625997, 'contradicts': 0.4810126582278481, 'parts_of_same': 0.8166666666666667}, 'recall': {'supports': 0.8998136067101584, 'contradicts': 0.7307692307692307, 'parts_of_same': 0.5833333333333334}, 'f1': {'supports': 0.9029693710544775, 'contradicts': 0.5801526717557252, 'parts_of_same': 0.6805555555555557}, 'support': {'supports': 2146, 'contradicts': 260, 'parts_of_same': 420}, 'micro_avg': {'precision': 0.8372257607926398, 'recall': 0.8372257607926398, 'f1': 0.8372257607926398, 'support': None}, 'macro_avg': {'precision': 0.7346088911857048, 'recall': 0.7379720569375742, 'f1': 0.7212258661219195, 'support': None}, 'weighted_avg': {'precision': 0.8537351384887402, 'recall': 0.8372257607926398, 'f1': 0.840214189056168, 'support': None}}
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0991, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0985, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0911, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8891, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3881, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8980, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3920, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0973, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0906, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5968, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0730, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6846, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0575, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1903, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0900, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3890, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0840, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6937, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3863, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3857, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1800, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5821, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2967, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0752, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0793, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6866, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1764, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2228e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 13---------------
Evaluating
				 {'precision': {'supports': 0.9157330735509012, 'contradicts': 0.4779220779220779, 'parts_of_same': 0.7319587628865979}, 'recall': {'supports': 0.8760484622553588, 'contradicts': 0.7076923076923077, 'parts_of_same': 0.6761904761904762}, 'f1': {'supports': 0.8954512979280781, 'contradicts': 0.5705426356589147, 'parts_of_same': 0.702970297029703}, 'support': {'supports': 2146, 'contradicts': 260, 'parts_of_same': 420}, 'micro_avg': {'precision': 0.8308563340410474, 'recall': 0.8308563340410474, 'f1': 0.8308563340410474, 'support': None}, 'macro_avg': {'precision': 0.7085379714531923, 'recall': 0.7533104153793809, 'f1': 0.722988076872232, 'support': None}, 'weighted_avg': {'precision': 0.8481406923256705, 'recall': 0.8308563340410474, 'f1': 0.8369522630493449, 'support': None}}
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7784, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0965, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9839, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8830, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0863, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0737, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3956, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1976, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1862, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1898, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0873, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0764, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6751, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0638, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0819, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0997, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0934, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5948, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4903, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0693, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1933, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0660, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1909, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 14---------------
Evaluating
				 {'precision': {'supports': 0.9418310571573091, 'contradicts': 0.5541795665634675, 'parts_of_same': 0.6615969581749049}, 'recall': {'supports': 0.8676607642124884, 'contradicts': 0.6884615384615385, 'parts_of_same': 0.8285714285714286}, 'f1': {'supports': 0.903225806451613, 'contradicts': 0.6140651801029159, 'parts_of_same': 0.7357293868921776}, 'support': {'supports': 2146, 'contradicts': 260, 'parts_of_same': 420}, 'micro_avg': {'precision': 0.8453644727530077, 'recall': 0.8453644727530077, 'f1': 0.8453644727530077, 'support': None}, 'macro_avg': {'precision': 0.7192025272985605, 'recall': 0.7948979104151519, 'f1': 0.7510067911489021, 'support': None}, 'weighted_avg': {'precision': 0.8645176427457704, 'recall': 0.8453644727530077, 'f1': 0.8517288994927934, 'support': None}}
Loss: tensor(2.9323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0741, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0939, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5740e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 15---------------
Evaluating
				 {'precision': {'supports': 0.9254013220018886, 'contradicts': 0.5910652920962199, 'parts_of_same': 0.762589928057554}, 'recall': {'supports': 0.9133271202236719, 'contradicts': 0.6615384615384615, 'parts_of_same': 0.7571428571428571}, 'f1': {'supports': 0.9193245778611632, 'contradicts': 0.6243194192377496, 'parts_of_same': 0.7598566308243728}, 'support': {'supports': 2146, 'contradicts': 260, 'parts_of_same': 420}, 'micro_avg': {'precision': 0.8669497523000708, 'recall': 0.8669497523000708, 'f1': 0.8669497523000708, 'support': None}, 'macro_avg': {'precision': 0.7596855140518876, 'recall': 0.7773361463016636, 'f1': 0.7678335426410952, 'support': None}, 'weighted_avg': {'precision': 0.8704444383387272, 'recall': 0.8669497523000708, 'f1': 0.8684831486334422, 'support': None}}
Loss: tensor(6.4109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 16---------------
Evaluating
				 {'precision': {'supports': 0.9303000968054211, 'contradicts': 0.5821917808219178, 'parts_of_same': 0.7094017094017094}, 'recall': {'supports': 0.8956197576887233, 'contradicts': 0.6538461538461539, 'parts_of_same': 0.7904761904761904}, 'f1': {'supports': 0.912630579297246, 'contradicts': 0.6159420289855073, 'parts_of_same': 0.7477477477477478}, 'support': {'supports': 2146, 'contradicts': 260, 'parts_of_same': 420}, 'micro_avg': {'precision': 0.8577494692144374, 'recall': 0.8577494692144374, 'f1': 0.8577494692144374, 'support': None}, 'macro_avg': {'precision': 0.7406311956763495, 'recall': 0.7799807006703557, 'f1': 0.7587734520101671, 'support': None}, 'weighted_avg': {'precision': 0.8654432373343419, 'recall': 0.8577494692144374, 'f1': 0.8608295133624118, 'support': None}}
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4172e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4491e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6300e-06, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 17---------------
Evaluating
				 {'precision': {'supports': 0.9316197866149369, 'contradicts': 0.584192439862543, 'parts_of_same': 0.7082452431289641}, 'recall': {'supports': 0.8951537744641193, 'contradicts': 0.6538461538461539, 'parts_of_same': 0.7976190476190477}, 'f1': {'supports': 0.9130228136882129, 'contradicts': 0.617059891107078, 'parts_of_same': 0.750279955207167}, 'support': {'supports': 2146, 'contradicts': 260, 'parts_of_same': 420}, 'micro_avg': {'precision': 0.8584571832979476, 'recall': 0.8584571832979476, 'f1': 0.8584571832979476, 'support': None}, 'macro_avg': {'precision': 0.7413524898688145, 'recall': 0.7822063253097736, 'f1': 0.7601208866674859, 'support': None}, 'weighted_avg': {'precision': 0.8664575720290447, 'recall': 0.8584571832979476, 'f1': 0.8616065502653063, 'support': None}}
Loss: tensor(3.2244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8472e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0372e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8472e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4310e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 18---------------
Evaluating
				 {'precision': {'supports': 0.9325242718446602, 'contradicts': 0.5827586206896552, 'parts_of_same': 0.707983193277311}, 'recall': {'supports': 0.8951537744641193, 'contradicts': 0.65, 'parts_of_same': 0.8023809523809524}, 'f1': {'supports': 0.9134569662387065, 'contradicts': 0.6145454545454546, 'parts_of_same': 0.752232142857143}, 'support': {'supports': 2146, 'contradicts': 260, 'parts_of_same': 420}, 'micro_avg': {'precision': 0.8588110403397028, 'recall': 0.8588110403397028, 'f1': 0.8588110403397028, 'support': None}, 'macro_avg': {'precision': 0.7410886952705421, 'recall': 0.7825115756150239, 'f1': 0.7600781878804348, 'support': None}, 'weighted_avg': {'precision': 0.8669735562400643, 'recall': 0.8588110403397028, 'f1': 0.861995034582478, 'support': None}}
Loss: tensor(2.2898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4491e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9079e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3767e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6525e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3767e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8653e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4534e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3224e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7024e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0355e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4057e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 19---------------
Evaluating
				 {'precision': {'supports': 0.932491500728509, 'contradicts': 0.5807560137457045, 'parts_of_same': 0.707983193277311}, 'recall': {'supports': 0.8946877912395154, 'contradicts': 0.65, 'parts_of_same': 0.8023809523809524}, 'f1': {'supports': 0.9131985731272294, 'contradicts': 0.6134301270417424, 'parts_of_same': 0.752232142857143}, 'support': {'supports': 2146, 'contradicts': 260, 'parts_of_same': 420}, 'micro_avg': {'precision': 0.8584571832979476, 'recall': 0.8584571832979476, 'f1': 0.8584571832979476, 'support': None}, 'macro_avg': {'precision': 0.7404102359171748, 'recall': 0.7823562478734892, 'f1': 0.7596202810087048, 'support': None}, 'weighted_avg': {'precision': 0.8667644250933242, 'recall': 0.8584571832979476, 'f1': 0.8616962034543125, 'support': None}}
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4595e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8472e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1430e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8472e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8244e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7024e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5593e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1982e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8885e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7205e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4310e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4896e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4129e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6525e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7875e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 20---------------
Evaluating
				 {'precision': {'supports': 0.9324258629071464, 'contradicts': 0.5787671232876712, 'parts_of_same': 0.7064989517819706}, 'recall': {'supports': 0.8937558247903076, 'contradicts': 0.65, 'parts_of_same': 0.8023809523809524}, 'f1': {'supports': 0.912681418034737, 'contradicts': 0.6123188405797102, 'parts_of_same': 0.7513935340022296}, 'support': {'supports': 2146, 'contradicts': 260, 'parts_of_same': 420}, 'micro_avg': {'precision': 0.8577494692144374, 'recall': 0.8577494692144374, 'f1': 0.8577494692144374, 'support': None}, 'macro_avg': {'precision': 0.7392306459922627, 'recall': 0.78204559239042, 'f1': 0.7587979308722256, 'support': None}, 'weighted_avg': {'precision': 0.8663110097671471, 'recall': 0.8577494692144374, 'f1': 0.8610766121494008, 'support': None}}
Loss: tensor(1.2459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9269e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5895e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2651e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8244e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4136e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8229e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8918e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7205e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4108e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0726e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7205e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1995e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3896e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7818e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1320e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4534e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3509e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9015e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6238e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9880e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3035e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 21---------------
Evaluating
				 {'precision': {'supports': 0.932912007778318, 'contradicts': 0.5793103448275863, 'parts_of_same': 0.7056367432150313}, 'recall': {'supports': 0.8942218080149115, 'contradicts': 0.6461538461538462, 'parts_of_same': 0.8047619047619048}, 'f1': {'supports': 0.9131572686176541, 'contradicts': 0.6109090909090908, 'parts_of_same': 0.7519466073414905}, 'support': {'supports': 2146, 'contradicts': 260, 'parts_of_same': 420}, 'micro_avg': {'precision': 0.8581033262561925, 'recall': 0.8581033262561925, 'f1': 0.8581033262561925, 'support': None}, 'macro_avg': {'precision': 0.7392863652736451, 'recall': 0.7817125196435541, 'f1': 0.7586709889560784, 'support': None}, 'weighted_avg': {'precision': 0.866602013622702, 'recall': 0.8581033262561925, 'f1': 0.8613904590138979, 'support': None}}
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0311e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7439e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8472e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0333e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6311e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6163e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7430e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5165e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7205e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8551e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6476e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4172e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1746e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8189e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5436e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0399e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0061e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5258e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4099e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3781e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5436e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3556e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6664e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6302e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7505e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7024e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4172e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9015e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6397e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4779e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4896e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0048e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0988e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4467e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 22---------------
Evaluating
				 {'precision': {'supports': 0.932912007778318, 'contradicts': 0.5793103448275863, 'parts_of_same': 0.7056367432150313}, 'recall': {'supports': 0.8942218080149115, 'contradicts': 0.6461538461538462, 'parts_of_same': 0.8047619047619048}, 'f1': {'supports': 0.9131572686176541, 'contradicts': 0.6109090909090908, 'parts_of_same': 0.7519466073414905}, 'support': {'supports': 2146, 'contradicts': 260, 'parts_of_same': 420}, 'micro_avg': {'precision': 0.8581033262561925, 'recall': 0.8581033262561925, 'f1': 0.8581033262561925, 'support': None}, 'macro_avg': {'precision': 0.7392863652736451, 'recall': 0.7817125196435541, 'f1': 0.7586709889560784, 'support': None}, 'weighted_avg': {'precision': 0.866602013622702, 'recall': 0.8581033262561925, 'f1': 0.8613904590138979, 'support': None}}
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5887e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5436e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1320e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7823e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6960e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2851e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2225e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1262e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3366e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9165e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9227e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3876e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6419e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1863e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8425e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4108e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5028e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1686e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1578e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7796e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9602e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4491e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2728e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3586e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5783e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5439e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1863e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9322e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1562e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2282e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6101e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7205e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2997e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7631e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8781e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4728e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0317e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6057e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4172e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4302e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1878e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2525e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5982e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5258e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0920e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5191e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6675e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1845e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4077e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5249e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3586e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2507e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5801e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7503e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7864e-06, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 23---------------
Evaluating
				 {'precision': {'supports': 0.932491500728509, 'contradicts': 0.5833333333333334, 'parts_of_same': 0.7056367432150313}, 'recall': {'supports': 0.8946877912395154, 'contradicts': 0.6461538461538462, 'parts_of_same': 0.8047619047619048}, 'f1': {'supports': 0.9131985731272294, 'contradicts': 0.6131386861313869, 'parts_of_same': 0.7519466073414905}, 'support': {'supports': 2146, 'contradicts': 260, 'parts_of_same': 420}, 'micro_avg': {'precision': 0.8584571832979476, 'recall': 0.8584571832979476, 'f1': 0.8584571832979476, 'support': None}, 'macro_avg': {'precision': 0.7404871924256246, 'recall': 0.7818678473850887, 'f1': 0.759427955533369, 'support': None}, 'weighted_avg': {'precision': 0.8666528164827884, 'recall': 0.8584571832979476, 'f1': 0.8616269537893211, 'support': None}}
Loss: tensor(8.3771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6779e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2044e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9278e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2750e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8319e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9767e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7920e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6598e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4167e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1066e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9405e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7693e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8598e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1041e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4940e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4308e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1491e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0211e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1633e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4129e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3375e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0218e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4653e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3849e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2862e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3224e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4394e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2723e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1487e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5331e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6194e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1165e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8763e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5266e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5209e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6889e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8714e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0940e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3730e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5957e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5825e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2723e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8714e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4370e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1918e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6807e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0916e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5191e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4767e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4759e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3648e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0869e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6644e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5430e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6648e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8472e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4043e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2048e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4313e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5436e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2704e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7783e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9459e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4726e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4538e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6558e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 24---------------
Evaluating
				 {'precision': {'supports': 0.9320388349514563, 'contradicts': 0.5833333333333334, 'parts_of_same': 0.7050209205020921}, 'recall': {'supports': 0.8946877912395154, 'contradicts': 0.6461538461538462, 'parts_of_same': 0.8023809523809524}, 'f1': {'supports': 0.9129814550641939, 'contradicts': 0.6131386861313869, 'parts_of_same': 0.7505567928730512}, 'support': {'supports': 2146, 'contradicts': 260, 'parts_of_same': 420}, 'micro_avg': {'precision': 0.8581033262561925, 'recall': 0.8581033262561925, 'f1': 0.8581033262561925, 'support': None}, 'macro_avg': {'precision': 0.7401310295956273, 'recall': 0.781074196591438, 'f1': 0.7588923113562106, 'support': None}, 'weighted_avg': {'precision': 0.866217548861773, 'recall': 0.8581033262561925, 'f1': 0.8612555251127396, 'support': None}}
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5035e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0785e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9531e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4295e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8520e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2313e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6783e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4172e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1668e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7951e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5328e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3483e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4112e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7207e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7750e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0891e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7931e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5310e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8224e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7677e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9783e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8394e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1821e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1222e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9697e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5562e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8688e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7366e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5037e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2569e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9554e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8735e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4216e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9013e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3138e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2503e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8845e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2423e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4801e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2862e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6904e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2392e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6960e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8825e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2019e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0706e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8405e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6180e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7154e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3203e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3600e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0975e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5439e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5862e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6006e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6361e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6037e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5394e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9041e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0352e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6461e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1977e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7324e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8573e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8417e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9946e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3379e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0068e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8922e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3185e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9043e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3191e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1070e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0573e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3851e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9439e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8878e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9920e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1637e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0573e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5010e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1207e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8604e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7556e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3531e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4384e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2891e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9412e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2213e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4284e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7573e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 25---------------
Evaluating
				 {'precision': {'supports': 0.9315866084425036, 'contradicts': 0.5833333333333334, 'parts_of_same': 0.7044025157232704}, 'recall': {'supports': 0.8946877912395154, 'contradicts': 0.6461538461538462, 'parts_of_same': 0.8}, 'f1': {'supports': 0.9127644402186831, 'contradicts': 0.6131386861313869, 'parts_of_same': 0.7491638795986622}, 'support': {'supports': 2146, 'contradicts': 260, 'parts_of_same': 420}, 'micro_avg': {'precision': 0.8577494692144374, 'recall': 0.8577494692144374, 'f1': 0.8577494692144374, 'support': None}, 'macro_avg': {'precision': 0.7397741524997025, 'recall': 0.7802805457977872, 'f1': 0.7583556686495774, 'support': None}, 'weighted_avg': {'precision': 0.8657822310644208, 'recall': 0.8577494692144374, 'f1': 0.8608837142727858, 'support': None}}
Loss: tensor(6.3373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5752e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3284e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9664e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3271e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3677e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4860e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4353e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0891e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5516e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9328e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5982e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8909e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0640e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9631e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9693e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6072e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6143e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8913e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0176e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1818e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4728e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9719e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4043e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1953e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8207e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7026e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3421e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6975e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5450e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9439e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5637e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5353e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0399e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7503e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1774e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4909e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4558e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8333e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8441e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7156e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8467e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3509e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9812e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7381e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9441e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7024e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2114e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8112e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7019e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7147e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1284e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2019e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7094e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0052e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7145e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2476e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8935e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7571e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2273e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5403e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4485e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2310e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6909e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6988e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9536e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4785e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3130e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1070e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7213e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4317e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4178e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3816e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4423e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8441e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8308e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1706e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6317e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8761e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9238e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9432e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4693e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5399e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8286e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7191e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2121e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8251e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0907e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3677e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3238e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8516e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7249e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1101e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2542e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5675e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9918e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1019e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7858e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6061e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2598e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3714e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8664e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3922e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1578e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9489e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6545e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9571e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8213e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5439e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8198e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7172e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 26---------------
Evaluating
				 {'precision': {'supports': 0.9315866084425036, 'contradicts': 0.5833333333333334, 'parts_of_same': 0.7044025157232704}, 'recall': {'supports': 0.8946877912395154, 'contradicts': 0.6461538461538462, 'parts_of_same': 0.8}, 'f1': {'supports': 0.9127644402186831, 'contradicts': 0.6131386861313869, 'parts_of_same': 0.7491638795986622}, 'support': {'supports': 2146, 'contradicts': 260, 'parts_of_same': 420}, 'micro_avg': {'precision': 0.8577494692144374, 'recall': 0.8577494692144374, 'f1': 0.8577494692144374, 'support': None}, 'macro_avg': {'precision': 0.7397741524997025, 'recall': 0.7802805457977872, 'f1': 0.7583556686495774, 'support': None}, 'weighted_avg': {'precision': 0.8657822310644208, 'recall': 0.8577494692144374, 'f1': 0.8608837142727858, 'support': None}}
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1496e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4891e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5767e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6785e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9602e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8746e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8602e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3708e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8955e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3743e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0955e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7019e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8865e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6646e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8046e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2728e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4677e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3478e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3628e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8973e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1459e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6231e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7317e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1397e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4770e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3454e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2823e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7317e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8863e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3094e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9626e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0496e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6068e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4070e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2856e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1143e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0417e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1783e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5759e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8838e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1688e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5085e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5927e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8355e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8889e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2856e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8108e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4940e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9372e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5653e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3536e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1231e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5302e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4236e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7200e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0586e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0145e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9860e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6792e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5487e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5436e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9554e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1838e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4467e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5675e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6368e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8554e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4746e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1593e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6920e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7019e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5887e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8547e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5955e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5015e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9022e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3207e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2633e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5233e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1706e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5264e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5399e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5225e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5911e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4465e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7909e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8224e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2598e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4701e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5900e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5949e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0673e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7878e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1050e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7443e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2832e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9225e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6242e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9783e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9628e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0781e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2845e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4172e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0920e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7556e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6604e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5688e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1863e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9304e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6666e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5328e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4077e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7055e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8767e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1491e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6255e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3984e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3191e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5403e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4313e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0242e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7518e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7518e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8549e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6384e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2313e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7308e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6538e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8516e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7125e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8271e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9419e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3774e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3281e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 27---------------
Evaluating
				 {'precision': {'supports': 0.9315866084425036, 'contradicts': 0.5833333333333334, 'parts_of_same': 0.7044025157232704}, 'recall': {'supports': 0.8946877912395154, 'contradicts': 0.6461538461538462, 'parts_of_same': 0.8}, 'f1': {'supports': 0.9127644402186831, 'contradicts': 0.6131386861313869, 'parts_of_same': 0.7491638795986622}, 'support': {'supports': 2146, 'contradicts': 260, 'parts_of_same': 420}, 'micro_avg': {'precision': 0.8577494692144374, 'recall': 0.8577494692144374, 'f1': 0.8577494692144374, 'support': None}, 'macro_avg': {'precision': 0.7397741524997025, 'recall': 0.7802805457977872, 'f1': 0.7583556686495774, 'support': None}, 'weighted_avg': {'precision': 0.8657822310644208, 'recall': 0.8577494692144374, 'f1': 0.8608837142727858, 'support': None}}
Loss: tensor(3.2891e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2779e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0198e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5017e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0825e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5191e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0278e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4684e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4286e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8701e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9284e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6920e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2465e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4628e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0675e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3845e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9255e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7026e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3801e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1099e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1551e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1375e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8876e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6320e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9821e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7059e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7750e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0827e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1207e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4726e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8882e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5346e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5388e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2973e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5258e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4384e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1114e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4626e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1578e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6851e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2953e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2085e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9015e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5809e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7273e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3368e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2598e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9527e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7421e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2320e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6304e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9902e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5920e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1103e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6231e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6860e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7973e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4651e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8231e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5163e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9666e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5988e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3172e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3765e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3900e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1657e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5900e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1454e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7960e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4158e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7871e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6452e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7487e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1865e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3587e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8538e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0112e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8450e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3953e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8127e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2302e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7218e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3266e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9666e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6573e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1388e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0015e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5809e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9646e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6851e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6503e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1534e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5821e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1434e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8595e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6476e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0794e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2869e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6704e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3408e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3434e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1940e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2342e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6856e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9699e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9331e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7249e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9030e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0050e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1635e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8854e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7765e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2134e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6536e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1750e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0975e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3962e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4352e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6907e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8962e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1942e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1719e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1063e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6626e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0077e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7397e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0061e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2143e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9129e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5278e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9072e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0112e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8573e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4077e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3587e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4578e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2957e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9172e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5439e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0598e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9688e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5434e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7121e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9999e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7443e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0459e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2918e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0492e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9895e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4026e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1198e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7028e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3670e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3655e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0379e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0666e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5489e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7236e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6693e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9324e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6176e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1412e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4556e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8957e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4180e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6516e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0114e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4180e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5216e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7430e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8586e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0858e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 28---------------
Evaluating
				 {'precision': {'supports': 0.9316197866149369, 'contradicts': 0.5853658536585366, 'parts_of_same': 0.7044025157232704}, 'recall': {'supports': 0.8951537744641193, 'contradicts': 0.6461538461538462, 'parts_of_same': 0.8}, 'f1': {'supports': 0.9130228136882129, 'contradicts': 0.6142595978062158, 'parts_of_same': 0.7491638795986622}, 'support': {'supports': 2146, 'contradicts': 260, 'parts_of_same': 420}, 'micro_avg': {'precision': 0.8581033262561925, 'recall': 0.8581033262561925, 'f1': 0.8581033262561925, 'support': None}, 'macro_avg': {'precision': 0.7404627186655812, 'recall': 0.7804358735393219, 'f1': 0.7588154303643636, 'support': None}, 'weighted_avg': {'precision': 0.865994423436181, 'recall': 0.8581033262561925, 'f1': 0.8611830442448547, 'support': None}}
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6677e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4432e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2286e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8154e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2405e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3955e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7509e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5258e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2587e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9390e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0339e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8401e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9593e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2642e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8185e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4677e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6454e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4896e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9534e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7763e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1244e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6313e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4198e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6624e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6410e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3308e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0969e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7441e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6776e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9862e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9681e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5472e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5845e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3253e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5531e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2801e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9044e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8779e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2816e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6375e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3198e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8593e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9262e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6443e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8792e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6622e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1172e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7200e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5419e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4039e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8547e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8348e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4860e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6801e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0984e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6114e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5227e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6887e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3085e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7699e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7024e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9487e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7249e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3353e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2997e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6421e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1114e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6138e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8452e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2317e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8558e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6123e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3421e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9516e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7461e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5452e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6686e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6761e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4229e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8869e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2227e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1549e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4565e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8220e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2019e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2761e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9953e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9390e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9255e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0913e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8878e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8741e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7792e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1194e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6670e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7715e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2728e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2331e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1863e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4895e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9580e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9953e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4143e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5310e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8512e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9962e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9191e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0688e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5439e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0130e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3916e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3615e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4068e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9668e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0189e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6719e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1019e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9048e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2600e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1262e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8311e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8697e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5370e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5487e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2816e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7792e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8370e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4421e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9317e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1714e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1222e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3041e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3138e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0017e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4880e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2008e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1293e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5116e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9509e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2059e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5145e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1207e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9578e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4534e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4205e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0121e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9593e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8401e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3977e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6200e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1244e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6423e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7032e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8205e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0999e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0995e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2167e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8944e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5580e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0664e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1443e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7615e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9746e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4900e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5785e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2512e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5262e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4158e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7441e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2134e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1324e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4862e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8904e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7582e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4024e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5918e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2776e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4637e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3909e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0492e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9805e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3319e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3485e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6408e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7434e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9962e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1825e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0311e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4397e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5737e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8538e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2019e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7194e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0209e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3264e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4845e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2348e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4953e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4366e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7644e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3556e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7013e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9236e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6624e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2099e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9397e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1412e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0046e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2768e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7019e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8059e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2430e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2489e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8827e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9169e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8039e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0507e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5198e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8626e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0876e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0509e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 29---------------
Evaluating
				 {'precision': {'supports': 0.9316860465116279, 'contradicts': 0.5874125874125874, 'parts_of_same': 0.7058823529411765}, 'recall': {'supports': 0.8960857409133272, 'contradicts': 0.6461538461538462, 'parts_of_same': 0.8}, 'f1': {'supports': 0.9135391923990499, 'contradicts': 0.6153846153846153, 'parts_of_same': 0.7500000000000001}, 'support': {'supports': 2146, 'contradicts': 260, 'parts_of_same': 420}, 'micro_avg': {'precision': 0.8588110403397028, 'recall': 0.8588110403397028, 'f1': 0.8588110403397028, 'support': None}, 'macro_avg': {'precision': 0.7416603289551307, 'recall': 0.7807465290223913, 'f1': 0.7596412692612217, 'support': None}, 'weighted_avg': {'precision': 0.8664529783356406, 'recall': 0.8588110403397028, 'f1': 0.8618029394509417, 'support': None}}
Loss: tensor(2.0521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9927e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9977e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4392e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8158e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1622e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3445e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4573e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6127e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5022e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5690e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8761e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1390e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0094e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3443e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7019e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5571e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7088e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2026e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9832e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2227e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5591e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4735e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9262e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2255e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0973e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2408e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8470e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6589e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9666e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9624e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5439e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1969e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2598e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0470e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8695e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4573e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0556e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1657e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6315e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7421e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9099e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2818e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1712e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9072e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3370e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8203e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3977e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8308e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2655e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4039e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0807e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7792e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2675e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7688e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4447e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2399e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4935e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5088e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0492e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6328e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2646e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0289e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7172e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1019e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1390e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5258e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3624e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9236e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2902e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6008e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8891e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9847e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5525e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7728e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0651e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2019e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8459e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8666e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8942e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6624e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1452e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8516e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3858e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6984e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2507e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4988e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6271e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3384e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3653e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8876e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0094e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7774e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9224e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6295e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6746e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1838e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2957e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0655e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9010e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0094e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5026e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8213e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6887e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1174e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4077e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3185e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7072e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9441e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8421e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2421e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7224e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9962e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0920e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1737e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4039e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5116e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7812e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3172e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6147e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9913e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9832e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7381e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2165e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0311e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9851e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3761e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8604e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6677e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3715e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2598e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8348e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2754e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5664e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4754e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5423e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9591e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2768e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6048e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3962e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8375e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8849e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5397e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7348e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1931e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9916e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5796e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4880e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5953e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3194e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8032e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8699e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4161e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2904e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8918e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6227e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0483e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2823e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0728e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4172e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1222e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5699e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3681e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6783e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1013e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2253e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7562e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8050e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2355e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5525e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7774e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5423e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4860e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3741e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0275e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0924e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8032e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1637e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8547e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6171e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7315e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4211e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2019e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2781e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9847e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7489e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4951e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7141e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2595e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7887e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1019e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1556e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6935e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3454e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5163e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 30---------------
Evaluating
				 {'precision': {'supports': 0.9316529326223946, 'contradicts': 0.5853658536585366, 'parts_of_same': 0.7058823529411765}, 'recall': {'supports': 0.8956197576887233, 'contradicts': 0.6461538461538462, 'parts_of_same': 0.8}, 'f1': {'supports': 0.9132810643858399, 'contradicts': 0.6142595978062158, 'parts_of_same': 0.7500000000000001}, 'support': {'supports': 2146, 'contradicts': 260, 'parts_of_same': 420}, 'micro_avg': {'precision': 0.8584571832979476, 'recall': 0.8584571832979476, 'f1': 0.8584571832979476, 'support': None}, 'macro_avg': {'precision': 0.7409670464073693, 'recall': 0.7805912012808566, 'f1': 0.7591802207306851, 'support': None}, 'weighted_avg': {'precision': 0.8662395271033873, 'recall': 0.8584571832979476, 'f1': 0.8615034181180568, 'support': None}}
Loss: tensor(1.0479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4220e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7628e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9406e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6657e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5944e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3858e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6646e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9050e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5229e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4485e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5088e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3130e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5403e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7313e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8331e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1940e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5388e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7401e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4136e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9578e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7628e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2302e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3257e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5213e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9969e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0441e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3489e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1333e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8701e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4189e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3273e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9046e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9461e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1328e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4907e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9405e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4339e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3827e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1116e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7024e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9600e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0854e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0465e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7441e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7681e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0962e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9653e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0558e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9044e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6591e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8024e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7628e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1361e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8125e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4258e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5125e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6203e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4982e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1368e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7236e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7765e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4664e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9032e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6589e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7434e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4935e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2266e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6022e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8492e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3379e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2776e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2889e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4664e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6123e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0805e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2664e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8695e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9099e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5845e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0302e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9236e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5865e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6260e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9768e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8763e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1176e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8741e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2030e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5999e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6655e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4392e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1759e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1008e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2368e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8125e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8227e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0626e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7370e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2112e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0957e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1262e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8125e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5851e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0370e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9569e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3862e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0626e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6589e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5079e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3236e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2169e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0328e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8728e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6147e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5209e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2673e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3478e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6289e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7858e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7637e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3849e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9869e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1624e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0999e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6423e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9403e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9847e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6851e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0900e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9931e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9022e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0558e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9236e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7946e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3673e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4534e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9913e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0289e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6134e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2889e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2278e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9163e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1063e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4518e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7688e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8565e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0779e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8761e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2233e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3500e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7697e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1721e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6231e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6772e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9251e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1194e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4935e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3445e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7631e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3646e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6518e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1368e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5487e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2414e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1737e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6030e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4633e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1505e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8512e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4935e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2165e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0593e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6425e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3640e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1743e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4686e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4505e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8895e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0558e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8741e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0558e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3229e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6328e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7236e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3063e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2999e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4039e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7403e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6352e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9319e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7551e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8761e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9721e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4880e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8849e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5161e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2052e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3909e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1026e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7478e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9257e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3735e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9191e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2216e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0701e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3454e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6538e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9236e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1677e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4085e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4156e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9397e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0211e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9304e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8088e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2052e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8331e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0275e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9955e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2796e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6770e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3849e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6174e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8024e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7032e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)


		-------------RUN 2-----------
			------------EPOCH 1---------------
Evaluating
				 {'precision': {'supports': 0.7295918367346939, 'contradicts': 0.0, 'parts_of_same': 0.13848920863309352}, 'recall': {'supports': 0.806390977443609, 'contradicts': 0.0, 'parts_of_same': 0.15682281059063136}, 'f1': {'supports': 0.7660714285714286, 'contradicts': 0.0, 'parts_of_same': 0.14708691499522444}, 'support': {'supports': 2128, 'contradicts': 289, 'parts_of_same': 491}, 'micro_avg': {'precision': 0.6165749656121046, 'recall': 0.6165749656121046, 'f1': 0.6165749656121046, 'support': None}, 'macro_avg': {'precision': 0.2893603484559291, 'recall': 0.3210712626780801, 'f1': 0.3043861145222177, 'support': None}, 'weighted_avg': {'precision': 0.5572797902373718, 'recall': 0.6165749656121046, 'f1': 0.5854262982333753, 'support': None}}
Loss: tensor(1.9982, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7834, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7985, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6820, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6873, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3862, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6972, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3805, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4952, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4824, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2908, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2910, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4789, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2941, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5758, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4924, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5575, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1927, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4955, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3967, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2917, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3972, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4959, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4771, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5637, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5846, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3857, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7818, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2914, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2963, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1968, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5954, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2991, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1948, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1928, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3733, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6962, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2883, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1878, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1784, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1980, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7848, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2817, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8939, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5912, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4793, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1949, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1951, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2741, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0940, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1900, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3830, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1981, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8900, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2991, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2676, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1949, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2887, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5796, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5886, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2772, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2956, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0852, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0835, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1739, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2949, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0909, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2679, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2934, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3926, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2939, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3924, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4879, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3800, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1896, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2777, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5772, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2870, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3938, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8693, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6730, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2910, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6967, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3976, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3912, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2906, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5985, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3981, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4815, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2730, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2867, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1833, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8000, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1991, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8771, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1887, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8771, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1897, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7904, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3751, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2958, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0819, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2819, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2941, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2834, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4887, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3999, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1720, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1954, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2972, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1981, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1942, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0949, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1720, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6965, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6782, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4824, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1947, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0947, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1806, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4888, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0819, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3883, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3693, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2965, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6833, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2793, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0833, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1931, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5991, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1575, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1690, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4918, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0892, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0805, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0687, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0800, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2890, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0994, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1848, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2870, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1938, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1979, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1575, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7951, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3926, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1679, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5733, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2758, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1960, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0979, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7887, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4891, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1887, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2925, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2925, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2830, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9897, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3879, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0878, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1840, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2973, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1952, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2771, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1967, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1764, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2867, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2943, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0963, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0986, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1980, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0892, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3954, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0886, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0931, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6951, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0945, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3873, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0991, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0837, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2992, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2739, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6998, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3885, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1960, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3925, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0575, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5660, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5883, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2873, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3930, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2916, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0903, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0931, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0742, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2808, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0962, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0912, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2000, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0857, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1959, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2986, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4676, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2771, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5889, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0958, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1908, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6886, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0890, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4927, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0877, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3637, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1953, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3883, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1934, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3996, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2772, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6793, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0752, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1777, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4934, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0764, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2793, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0767, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1920, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3793, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0961, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1989, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0834, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4733, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4936, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1801, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5866, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4939, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0947, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1953, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5886, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1839, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2141, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 2---------------
Evaluating
				 {'precision': {'supports': 0.9659011830201809, 'contradicts': 0.45320197044334976, 'parts_of_same': 0.4328638497652582}, 'recall': {'supports': 0.6522556390977443, 'contradicts': 0.6366782006920415, 'parts_of_same': 0.9389002036659878}, 'f1': {'supports': 0.7786816269284712, 'contradicts': 0.529496402877698, 'parts_of_same': 0.5925449871465295}, 'support': {'supports': 2128, 'contradicts': 289, 'parts_of_same': 491}, 'micro_avg': {'precision': 0.6991059147180193, 'recall': 0.6991059147180193, 'f1': 0.6991059147180193, 'support': None}, 'macro_avg': {'precision': 0.6173223344095963, 'recall': 0.7426113478185913, 'f1': 0.6335743389842329, 'support': None}, 'weighted_avg': {'precision': 0.8249481558321234, 'recall': 0.6991059147180193, 'f1': 0.7224891854279186, 'support': None}}
Loss: tensor(0.1310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1886, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0815, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2947, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0741, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1839, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1889, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7796, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0730, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0805, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0796, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0955, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0784, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0833, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1879, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1747, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2000, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0993, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0888, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2676, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6739, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0679, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0835, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3863, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0916, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0976, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0833, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0848, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0940, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0777, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0991, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2891, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0848, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0885, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0575, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0988, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0862, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0875, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0928, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2959, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1819, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8908, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8920, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0758, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1846, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0957, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2975, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1926, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0886, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0980, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1852, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2975, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0638, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1751, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4975, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1764, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1939, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7967, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0830, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1999, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0690, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5758, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0806, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0771, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0971, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0806, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0784, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0849, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2782, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5887, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1874, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5948, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0980, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3742, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1883, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0995, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9943, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1789, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0771, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4846, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6991, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0906, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1762, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1980, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0991, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1943, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3846, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2886, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0918, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1952, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2849, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1676, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2908, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2762, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0796, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9762, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0997, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2886, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0777, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0789, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8916, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1928, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1956, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1979, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0998, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0946, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0955, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3976, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0820, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3906, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0958, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0961, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0742, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3789, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3000, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1967, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3716, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4808, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4794, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1956, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0938, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0736, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5887, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7747, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3962, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2830, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3917, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1975, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1881, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0999, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0818, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0921, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0866, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0796, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0846, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1889, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0800, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0849, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0914, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0767, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3963, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0954, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1953, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1853, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0873, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5690, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0887, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0906, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7940, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1946, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2973, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0962, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0934, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1898, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1892, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0914, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0867, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2739, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0990, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2903, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1936, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0830, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0764, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9762, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0909, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2904, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9840, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0898, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0972, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6833, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1952, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4883, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5900, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1982, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1953, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1730, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3638, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0943, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 3---------------
Evaluating
				 {'precision': {'supports': 0.9593596059113301, 'contradicts': 0.4898876404494382, 'parts_of_same': 0.5220500595947557}, 'recall': {'supports': 0.7321428571428571, 'contradicts': 0.754325259515571, 'parts_of_same': 0.8920570264765784}, 'f1': {'supports': 0.8304904051172707, 'contradicts': 0.5940054495912807, 'parts_of_same': 0.6586466165413534}, 'support': {'supports': 2128, 'contradicts': 289, 'parts_of_same': 491}, 'micro_avg': {'precision': 0.7613480055020633, 'recall': 0.7613480055020633, 'f1': 0.7613480055020633, 'support': None}, 'macro_avg': {'precision': 0.6570991019851747, 'recall': 0.7928417143783356, 'f1': 0.6943808237499681, 'support': None}, 'weighted_avg': {'precision': 0.8388656632497329, 'recall': 0.7613480055020633, 'f1': 0.7779733994990499, 'support': None}}
Loss: tensor(0.2829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0957, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1679, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2987, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4821, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0817, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0638, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2853, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3973, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0720, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5908, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0938, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0862, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1818, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0874, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0800, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0943, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4772, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0967, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6993, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3840, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3900, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0848, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0957, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1720, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0857, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2782, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6987, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0679, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1676, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1787, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3996, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0862, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1943, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5817, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0904, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0833, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0839, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0897, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0936, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1885, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0981, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0879, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0958, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1976, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0925, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2998, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4925, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6956, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1940, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6968, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1879, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0764, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1903, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0883, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2687, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0764, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0793, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0741, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9911, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0918, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3772, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0815, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1789, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0693, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0848, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0987, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0980, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0994, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0839, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1967, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0981, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6981, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0862, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8891, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0863, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2963, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0739, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 4---------------
Evaluating
				 {'precision': {'supports': 0.9226722777485534, 'contradicts': 0.5946969696969697, 'parts_of_same': 0.5746971736204576}, 'recall': {'supports': 0.8242481203007519, 'contradicts': 0.5432525951557093, 'parts_of_same': 0.869653767820774}, 'f1': {'supports': 0.8706875155125342, 'contradicts': 0.5678119349005425, 'parts_of_same': 0.6920583468395461}, 'support': {'supports': 2128, 'contradicts': 289, 'parts_of_same': 491}, 'micro_avg': {'precision': 0.8039889958734525, 'recall': 0.8039889958734525, 'f1': 0.8039889958734524, 'support': None}, 'macro_avg': {'precision': 0.6973554736886602, 'recall': 0.7457181610924118, 'f1': 0.710185932417541, 'support': None}, 'weighted_avg': {'precision': 0.8313240521110695, 'recall': 0.8039889958734525, 'f1': 0.8104268674329942, 'support': None}}
Loss: tensor(0.0619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3885, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1874, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2954, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0772, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0951, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0787, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1873, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0637, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4805, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7906, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4921, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3860, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5962, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0926, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1690, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2840, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0873, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0690, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0904, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0867, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0903, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0919, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0852, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2848, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4910, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0949, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0837, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8957, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2737, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0986, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0995, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9784, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0693, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0972, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0716, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0931, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1820, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1883, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0824, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2923, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9948, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4934, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0910, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1764, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0687, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8758, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0796, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0575, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2933, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1946, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0915, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0896, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0762, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6969, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0887, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0934, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2917, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1660, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0890, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 5---------------
Evaluating
				 {'precision': {'supports': 0.920059582919563, 'contradicts': 0.6844444444444444, 'parts_of_same': 0.6113602391629297}, 'recall': {'supports': 0.8707706766917294, 'contradicts': 0.532871972318339, 'parts_of_same': 0.8329938900203666}, 'f1': {'supports': 0.8947368421052632, 'contradicts': 0.5992217898832685, 'parts_of_same': 0.7051724137931036}, 'support': {'supports': 2128, 'contradicts': 289, 'parts_of_same': 491}, 'micro_avg': {'precision': 0.8308115543328748, 'recall': 0.8308115543328748, 'f1': 0.8308115543328748, 'support': None}, 'macro_avg': {'precision': 0.7386214221756457, 'recall': 0.745545513010145, 'f1': 0.7330436819272118, 'support': None}, 'weighted_avg': {'precision': 0.8445217036885396, 'recall': 0.8308115543328748, 'f1': 0.8333613316536033, 'support': None}}
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3875, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3997, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0969, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6733, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0782, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4942, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0999, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3951, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1720, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4952, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0806, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3959, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0739, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0693, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0830, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3956, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2000, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0952, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0818, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2846, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1994, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0805, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1959, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0927, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0934, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6943, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3948, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0808, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0874, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0925, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3958, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0909, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7821, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 6---------------
Evaluating
				 {'precision': {'supports': 0.9247417609444171, 'contradicts': 0.7071129707112971, 'parts_of_same': 0.6477987421383647}, 'recall': {'supports': 0.8834586466165414, 'contradicts': 0.5847750865051903, 'parts_of_same': 0.8391038696537678}, 'f1': {'supports': 0.9036289353520788, 'contradicts': 0.6401515151515151, 'parts_of_same': 0.7311446317657497}, 'support': {'supports': 2128, 'contradicts': 289, 'parts_of_same': 491}, 'micro_avg': {'precision': 0.8462861072902338, 'recall': 0.8462861072902338, 'f1': 0.8462861072902338, 'support': None}, 'macro_avg': {'precision': 0.7598844912646929, 'recall': 0.7691125342584998, 'f1': 0.7583083607564479, 'support': None}, 'weighted_avg': {'precision': 0.856353266236321, 'recall': 0.8462861072902338, 'f1': 0.848321243639957, 'support': None}}
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2909, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1742, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0918, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0758, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3837, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1990, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0918, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4803, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4971, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0955, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0986, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2995, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0575, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3787, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0806, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 7---------------
Evaluating
				 {'precision': {'supports': 0.9294117647058824, 'contradicts': 0.6438848920863309, 'parts_of_same': 0.6207407407407407}, 'recall': {'supports': 0.8538533834586466, 'contradicts': 0.6193771626297578, 'parts_of_same': 0.8533604887983707}, 'f1': {'supports': 0.8900318393338232, 'contradicts': 0.6313932980599648, 'parts_of_same': 0.7186963979416809}, 'support': {'supports': 2128, 'contradicts': 289, 'parts_of_same': 491}, 'micro_avg': {'precision': 0.8304676753782668, 'recall': 0.8304676753782668, 'f1': 0.8304676753782668, 'support': None}, 'macro_avg': {'precision': 0.7313457991776513, 'recall': 0.7755303449622583, 'f1': 0.7467071784451563, 'support': None}, 'weighted_avg': {'precision': 0.8489183881742679, 'recall': 0.8304676753782668, 'f1': 0.8353990194742336, 'support': None}}
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2954, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6780e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 8---------------
Evaluating
				 {'precision': {'supports': 0.9146806482364156, 'contradicts': 0.6161290322580645, 'parts_of_same': 0.736}, 'recall': {'supports': 0.9017857142857143, 'contradicts': 0.6608996539792388, 'parts_of_same': 0.7494908350305499}, 'f1': {'supports': 0.9081874112636064, 'contradicts': 0.6377295492487479, 'parts_of_same': 0.7426841574167506}, 'support': {'supports': 2128, 'contradicts': 289, 'parts_of_same': 491}, 'micro_avg': {'precision': 0.8521320495185695, 'recall': 0.8521320495185695, 'f1': 0.8521320495185694, 'support': None}, 'macro_avg': {'precision': 0.7556032268314933, 'recall': 0.7707254010985011, 'f1': 0.7628670393097016, 'support': None}, 'weighted_avg': {'precision': 0.8548410281188696, 'recall': 0.8521320495185695, 'f1': 0.8533647084571757, 'support': None}}
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3405e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0824, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 9---------------
Evaluating
				 {'precision': {'supports': 0.920665083135392, 'contradicts': 0.714859437751004, 'parts_of_same': 0.7093862815884476}, 'recall': {'supports': 0.9107142857142857, 'contradicts': 0.615916955017301, 'parts_of_same': 0.8004073319755601}, 'f1': {'supports': 0.9156626506024097, 'contradicts': 0.6617100371747211, 'parts_of_same': 0.7521531100478469}, 'support': {'supports': 2128, 'contradicts': 289, 'parts_of_same': 491}, 'micro_avg': {'precision': 0.8627922971114168, 'recall': 0.8627922971114168, 'f1': 0.8627922971114168, 'support': None}, 'macro_avg': {'precision': 0.7816369341582812, 'recall': 0.7756795242357156, 'f1': 0.7765085992749926, 'support': None}, 'weighted_avg': {'precision': 0.8645386309085564, 'recall': 0.8627922971114168, 'f1': 0.8628168838579489, 'support': None}}
Loss: tensor(3.0328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3405e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4904, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4310e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2912, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7078e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 10---------------
Evaluating
				 {'precision': {'supports': 0.9186761229314421, 'contradicts': 0.7125506072874493, 'parts_of_same': 0.7142857142857143}, 'recall': {'supports': 0.9130639097744361, 'contradicts': 0.6089965397923875, 'parts_of_same': 0.7942973523421588}, 'f1': {'supports': 0.9158614188074475, 'contradicts': 0.6567164179104477, 'parts_of_same': 0.7521697203471552}, 'support': {'supports': 2128, 'contradicts': 289, 'parts_of_same': 491}, 'micro_avg': {'precision': 0.8627922971114168, 'recall': 0.8627922971114168, 'f1': 0.8627922971114168, 'support': None}, 'macro_avg': {'precision': 0.7818374815015353, 'recall': 0.7721192673029941, 'f1': 0.7749158523550168, 'support': None}, 'weighted_avg': {'precision': 0.8636809493873684, 'recall': 0.8627922971114168, 'f1': 0.862468870938384, 'support': None}}
Loss: tensor(4.5557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9043e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 11---------------
Evaluating
				 {'precision': {'supports': 0.9196172248803828, 'contradicts': 0.6617647058823529, 'parts_of_same': 0.7142857142857143}, 'recall': {'supports': 0.9031954887218046, 'contradicts': 0.6228373702422145, 'parts_of_same': 0.7942973523421588}, 'f1': {'supports': 0.9113323850165954, 'contradicts': 0.6417112299465241, 'parts_of_same': 0.7521697203471552}, 'support': {'supports': 2128, 'contradicts': 289, 'parts_of_same': 491}, 'micro_avg': {'precision': 0.8569463548830811, 'recall': 0.8569463548830811, 'f1': 0.856946354883081, 'support': None}, 'macro_avg': {'precision': 0.7652225483494833, 'recall': 0.773443403768726, 'f1': 0.768404445103425, 'support': None}, 'weighted_avg': {'precision': 0.8593224691402134, 'recall': 0.8569463548830811, 'f1': 0.8576634090303691, 'support': None}}
Loss: tensor(4.9469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8653e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3405e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4310e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8472e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1971, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7645e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 12---------------
Evaluating
				 {'precision': {'supports': 0.9176136363636364, 'contradicts': 0.6961538461538461, 'parts_of_same': 0.7182835820895522}, 'recall': {'supports': 0.9107142857142857, 'contradicts': 0.6262975778546713, 'parts_of_same': 0.7841140529531568}, 'f1': {'supports': 0.9141509433962264, 'contradicts': 0.6593806921675774, 'parts_of_same': 0.7497565725413827}, 'support': {'supports': 2128, 'contradicts': 289, 'parts_of_same': 491}, 'micro_avg': {'precision': 0.8610729023383769, 'recall': 0.8610729023383769, 'f1': 0.8610729023383769, 'support': None}, 'macro_avg': {'precision': 0.7773503548690116, 'recall': 0.7737086388407045, 'f1': 0.7744294027017289, 'support': None}, 'weighted_avg': {'precision': 0.8619489403460282, 'recall': 0.8610729023383769, 'f1': 0.8610745201861824, 'support': None}}
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7792e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2185e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9960e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7205e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6421e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4172e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6706e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7920e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5721e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 13---------------
Evaluating
				 {'precision': {'supports': 0.9176526265972551, 'contradicts': 0.6964980544747081, 'parts_of_same': 0.7156133828996283}, 'recall': {'supports': 0.9111842105263158, 'contradicts': 0.6193771626297578, 'parts_of_same': 0.7841140529531568}, 'f1': {'supports': 0.9144069794859704, 'contradicts': 0.6556776556776556, 'parts_of_same': 0.7482993197278913}, 'support': {'supports': 2128, 'contradicts': 289, 'parts_of_same': 491}, 'micro_avg': {'precision': 0.8607290233837689, 'recall': 0.8607290233837689, 'f1': 0.8607290233837689, 'support': None}, 'macro_avg': {'precision': 0.7765880213238638, 'recall': 0.7715584753697434, 'f1': 0.7727946516305058, 'support': None}, 'weighted_avg': {'precision': 0.8615608315494728, 'recall': 0.8607290233837689, 'f1': 0.8606478200905716, 'support': None}}
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2225e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9015e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1350e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7041e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5143e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8077e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9920e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5436e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4896e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4353e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2099e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7026e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7205e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5436e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 14---------------
Evaluating
				 {'precision': {'supports': 0.9184549356223176, 'contradicts': 0.6666666666666666, 'parts_of_same': 0.7193308550185874}, 'recall': {'supports': 0.9050751879699248, 'contradicts': 0.629757785467128, 'parts_of_same': 0.7881873727087576}, 'f1': {'supports': 0.9117159763313609, 'contradicts': 0.6476868327402135, 'parts_of_same': 0.7521865889212828}, 'support': {'supports': 2128, 'contradicts': 289, 'parts_of_same': 491}, 'micro_avg': {'precision': 0.8579779917469051, 'recall': 0.8579779917469051, 'f1': 0.8579779917469053, 'support': None}, 'macro_avg': {'precision': 0.7681508191025239, 'recall': 0.7743401153819368, 'f1': 0.7705297993309524, 'support': None}, 'weighted_avg': {'precision': 0.8598109420512672, 'recall': 0.8579779917469051, 'f1': 0.8585408209956696, 'support': None}}
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3999e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5708e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0688e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4320e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0928, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0961, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2225e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3224e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8878e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3004e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8582e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5436e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9421e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4896e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3328e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8940e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0026e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5876e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8706e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2913e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8697e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9452e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7898e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7125e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8141e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6163e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2233e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7249e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1531e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9600e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4726e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 15---------------
Evaluating
				 {'precision': {'supports': 0.9175746091899574, 'contradicts': 0.6953125, 'parts_of_same': 0.7171903881700554}, 'recall': {'supports': 0.9102443609022557, 'contradicts': 0.615916955017301, 'parts_of_same': 0.790224032586558}, 'f1': {'supports': 0.9138947865062517, 'contradicts': 0.6532110091743119, 'parts_of_same': 0.751937984496124}, 'support': {'supports': 2128, 'contradicts': 289, 'parts_of_same': 491}, 'micro_avg': {'precision': 0.8607290233837689, 'recall': 0.8607290233837689, 'f1': 0.8607290233837689, 'support': None}, 'macro_avg': {'precision': 0.7766924991200043, 'recall': 0.7721284495020383, 'f1': 0.7730145933922291, 'support': None}, 'weighted_avg': {'precision': 0.861652187567994, 'recall': 0.8607290233837689, 'f1': 0.8606422413082107, 'support': None}}
Loss: tensor(2.7028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9015e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5714e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9796e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6591e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9015e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8695e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4904e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5878e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3207e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5185e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9554e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5010e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7973e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4664e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3586e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5041e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2044e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1723e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9684e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1222e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3518e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2167e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6706e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1320e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4962e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9565e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7677e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 16---------------
Evaluating
				 {'precision': {'supports': 0.9181731684110371, 'contradicts': 0.6703703703703704, 'parts_of_same': 0.7201492537313433}, 'recall': {'supports': 0.9069548872180451, 'contradicts': 0.6262975778546713, 'parts_of_same': 0.7861507128309573}, 'f1': {'supports': 0.9125295508274233, 'contradicts': 0.6475849731663685, 'parts_of_same': 0.7517039922103212}, 'support': {'supports': 2128, 'contradicts': 289, 'parts_of_same': 491}, 'micro_avg': {'precision': 0.8586657496561211, 'recall': 0.8586657496561211, 'f1': 0.8586657496561211, 'support': None}, 'macro_avg': {'precision': 0.769564264170917, 'recall': 0.7731343926345579, 'f1': 0.7706061720680376, 'support': None}, 'weighted_avg': {'precision': 0.8601110120350116, 'recall': 0.8586657496561211, 'f1': 0.859044567256226, 'support': None}}
Loss: tensor(1.4810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5425e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5827e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2582e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5549e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5138e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8642e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5801e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2163e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1863e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8776e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6622e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5783e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0626e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8845e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3225e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2165e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9783e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7750e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2723e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0569e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2454e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0772e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7388e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9452e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6898e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3681e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7302e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0677e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0077e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1631e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9381e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5827e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5602e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1441e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9059e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7375e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1169e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9269e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1172e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2598e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4216e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2295e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8472e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5278e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3072e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7441e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2470e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9554e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 17---------------
Evaluating
				 {'precision': {'supports': 0.9176526265972551, 'contradicts': 0.6911196911196911, 'parts_of_same': 0.7220149253731343}, 'recall': {'supports': 0.9111842105263158, 'contradicts': 0.6193771626297578, 'parts_of_same': 0.7881873727087576}, 'f1': {'supports': 0.9144069794859704, 'contradicts': 0.6532846715328466, 'parts_of_same': 0.7536514118792599}, 'support': {'supports': 2128, 'contradicts': 289, 'parts_of_same': 491}, 'micro_avg': {'precision': 0.8614167812929848, 'recall': 0.8614167812929848, 'f1': 0.8614167812929848, 'support': None}, 'macro_avg': {'precision': 0.7769290810300268, 'recall': 0.7729162486216105, 'f1': 0.7737810209660255, 'support': None}, 'weighted_avg': {'precision': 0.8621071899899443, 'recall': 0.8614167812929848, 'f1': 0.8613136745707891, 'support': None}}
Loss: tensor(2.4917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3896e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9070e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6408e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9518e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8516e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9324e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1865e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2587e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4896e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4944e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9015e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5595e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8154e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5436e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8935e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6520e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3284e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4904e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9728e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8079e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3699e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9225e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1441e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6236e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9505e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2015e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2931e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7006e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2392e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0728e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6282e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4127e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3406e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0803e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7628e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5878e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9439e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7205e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5673e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1920e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4172e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8037e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0129e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4997e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5527e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5077e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3459e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6644e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9712e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7896e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1863e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2406e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5942e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0640e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5982e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5580e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1046e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9615e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5094e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4823e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3728e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9026e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4534e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5022e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3441e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3066e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9556e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2598e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9057e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3019e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7207e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1569e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0134e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8165e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8257e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5982e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7068e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2598e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9558e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6046e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 18---------------
Evaluating
				 {'precision': {'supports': 0.917296786389414, 'contradicts': 0.6953125, 'parts_of_same': 0.7220149253731343}, 'recall': {'supports': 0.912124060150376, 'contradicts': 0.615916955017301, 'parts_of_same': 0.7881873727087576}, 'f1': {'supports': 0.914703110273327, 'contradicts': 0.6532110091743119, 'parts_of_same': 0.7536514118792599}, 'support': {'supports': 2128, 'contradicts': 289, 'parts_of_same': 491}, 'micro_avg': {'precision': 0.8617606602475929, 'recall': 0.8617606602475929, 'f1': 0.8617606602475929, 'support': None}, 'macro_avg': {'precision': 0.7782080705875161, 'recall': 0.7720761292921449, 'f1': 0.7738551771089662, 'support': None}, 'weighted_avg': {'precision': 0.8622634808441824, 'recall': 0.8617606602475929, 'f1': 0.8615230548644197, 'support': None}}
Loss: tensor(2.4623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8348e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4604e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0278e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5492e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1863e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3673e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4714e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7500e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9796e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1050e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3631e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3311e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7209e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5227e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8165e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9405e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4401e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3072e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4310e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7865e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6591e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1571e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0339e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9443e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4286e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5353e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7622e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7847e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8130e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8895e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2949e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1154e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1569e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6807e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2092e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8591e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6068e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3946e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4397e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9587e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4445e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4357e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2726e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4172e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0008e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8931e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0302e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3129e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2604e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9909e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9388e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7794e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7483e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9066e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6719e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0461e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6706e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6443e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2973e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6635e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1909e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0459e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4626e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0785e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5653e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2860e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1774e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8580e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8633e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4801e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7178e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9375e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3293e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7496e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9693e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3821e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5229e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9580e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7624e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7141e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0507e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3010e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9394e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7880e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6675e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2313e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2077e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7505e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7889e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7077e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0635e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5509e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2123e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6264e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8616e-06, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 19---------------
Evaluating
				 {'precision': {'supports': 0.9169027384324835, 'contradicts': 0.6980392156862745, 'parts_of_same': 0.7214953271028037}, 'recall': {'supports': 0.9125939849624061, 'contradicts': 0.615916955017301, 'parts_of_same': 0.7861507128309573}, 'f1': {'supports': 0.9147432878002826, 'contradicts': 0.6544117647058824, 'parts_of_same': 0.7524366471734893}, 'support': {'supports': 2128, 'contradicts': 289, 'parts_of_same': 491}, 'micro_avg': {'precision': 0.8617606602475929, 'recall': 0.8617606602475929, 'f1': 0.8617606602475929, 'support': None}, 'macro_avg': {'precision': 0.7788124270738539, 'recall': 0.7715538842702214, 'f1': 0.7738638998932181, 'support': None}, 'weighted_avg': {'precision': 0.862158379066415, 'recall': 0.8617606602475929, 'f1': 0.861466681637271, 'support': None}}
Loss: tensor(1.1347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9920e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6308e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6313e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8006e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4028e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9310e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3865e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9353e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3589e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7068e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5459e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8832e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7823e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4143e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7586e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1048e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1251e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4308e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7229e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6911e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3896e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0123e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9331e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9353e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3984e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2024e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3200e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2735e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8573e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0470e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3525e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4070e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9375e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6123e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8218e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9735e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1079e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7527e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6121e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3311e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7004e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9116e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0533e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4847e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5765e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3006e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1320e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4860e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9916e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5260e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0189e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4264e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3185e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9331e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6944e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8686e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9626e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9677e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2454e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7375e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2310e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4233e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3101e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8158e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5485e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8145e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7571e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1032e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3094e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3278e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1050e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8860e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0470e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5845e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3715e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9037e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4578e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2205e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1761e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1006e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2801e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3399e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8231e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7313e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6525e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9743e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4940e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3693e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5282e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1320e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8754e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3432e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8516e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1220e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4165e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6642e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5048e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8052e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6324e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8651e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6072e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2044e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2044e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 20---------------
Evaluating
				 {'precision': {'supports': 0.9169419537517697, 'contradicts': 0.6980392156862745, 'parts_of_same': 0.7228464419475655}, 'recall': {'supports': 0.9130639097744361, 'contradicts': 0.615916955017301, 'parts_of_same': 0.7861507128309573}, 'f1': {'supports': 0.9149988226983753, 'contradicts': 0.6544117647058824, 'parts_of_same': 0.7531707317073172}, 'support': {'supports': 2128, 'contradicts': 289, 'parts_of_same': 491}, 'micro_avg': {'precision': 0.8621045392022009, 'recall': 0.8621045392022009, 'f1': 0.862104539202201, 'support': None}, 'macro_avg': {'precision': 0.7792758704618699, 'recall': 0.7717105258742315, 'f1': 0.7741937730371916, 'support': None}, 'weighted_avg': {'precision': 0.8624152042343032, 'recall': 0.8621045392022009, 'f1': 0.8617776217229833, 'support': None}}
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4863e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1774e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5258e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2205e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4498e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7849e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0633e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4317e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5125e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3615e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9381e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6803e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4198e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2227e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1549e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4975e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3218e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5554e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6966e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7973e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1805e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3255e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6904e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4211e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8032e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5712e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2723e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6730e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5026e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4498e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3220e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7145e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4461e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8198e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7622e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1911e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8050e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5690e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6022e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9430e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8154e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5063e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8037e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1863e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5589e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1346e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7487e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3503e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3562e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0500e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5966e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3101e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5525e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3357e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7924e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7249e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5812e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1213e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2913e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4794e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2019e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2019e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8533e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7821e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8922e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2483e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9465e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1675e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4129e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2132e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0121e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7527e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9022e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8847e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1509e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3854e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3492e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3540e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9070e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5450e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8869e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5924e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5878e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8412e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6384e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4807e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3129e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3017e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1918e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8322e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2224e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9441e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8255e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8900e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9949e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0999e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0851e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9319e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7779e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5381e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4203e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2708e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0838e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9346e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5999e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9209e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5147e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5730e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1361e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2595e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6167e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4103e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7366e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2913e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8944e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3895e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3977e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5308e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0655e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5735e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1690e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4491e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5061e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3198e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7101e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1443e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8518e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7737e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4540e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8898e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3920e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 21---------------
Evaluating
				 {'precision': {'supports': 0.9169419537517697, 'contradicts': 0.6980392156862745, 'parts_of_same': 0.7228464419475655}, 'recall': {'supports': 0.9130639097744361, 'contradicts': 0.615916955017301, 'parts_of_same': 0.7861507128309573}, 'f1': {'supports': 0.9149988226983753, 'contradicts': 0.6544117647058824, 'parts_of_same': 0.7531707317073172}, 'support': {'supports': 2128, 'contradicts': 289, 'parts_of_same': 491}, 'micro_avg': {'precision': 0.8621045392022009, 'recall': 0.8621045392022009, 'f1': 0.862104539202201, 'support': None}, 'macro_avg': {'precision': 0.7792758704618699, 'recall': 0.7717105258742315, 'f1': 0.7741937730371916, 'support': None}, 'weighted_avg': {'precision': 0.8624152042343032, 'recall': 0.8621045392022009, 'f1': 0.8617776217229833, 'support': None}}
Loss: tensor(1.3346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8476e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9399e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8176e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6878e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1013e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0704e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2447e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1772e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5706e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0741e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7666e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9200e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8313e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8286e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3628e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4030e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8037e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8030e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1737e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4485e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2514e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7509e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1145e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2750e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1125e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5801e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4405e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8911e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7079e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2044e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4527e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1657e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8693e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0549e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4405e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0507e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6412e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0145e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7924e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4644e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2134e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7759e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5664e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4637e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9441e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5388e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3633e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6942e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3809e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2916e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3004e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9666e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0028e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3207e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8331e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2180e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9940e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8699e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0598e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6059e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9580e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0589e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0735e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5982e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9412e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2293e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7443e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6838e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9216e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1633e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7163e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6887e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6805e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6589e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1569e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8331e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7271e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7198e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2052e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1092e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0869e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5203e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7489e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5880e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1746e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4353e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8942e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9735e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3562e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0728e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1496e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9218e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7171e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1556e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0982e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2655e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7533e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6635e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1320e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0121e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0174e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3761e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5918e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1582e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2313e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4249e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4161e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8666e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1893e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2233e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8286e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5194e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0999e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7869e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9454e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0289e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1112e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1805e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6918e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1068e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7353e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9485e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3194e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8331e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3953e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9143e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4353e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4975e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9397e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6962e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2997e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3231e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7593e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2741e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8052e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6783e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4176e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5516e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0114e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8485e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3878e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6220e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9763e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7743e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3408e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2529e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8205e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0465e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7675e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0028e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3063e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9236e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6489e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6105e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2218e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4565e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6615e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6233e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6838e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7485e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 22---------------
Evaluating
				 {'precision': {'supports': 0.9169811320754717, 'contradicts': 0.7007874015748031, 'parts_of_same': 0.7228464419475655}, 'recall': {'supports': 0.9135338345864662, 'contradicts': 0.615916955017301, 'parts_of_same': 0.7861507128309573}, 'f1': {'supports': 0.9152542372881355, 'contradicts': 0.6556169429097606, 'parts_of_same': 0.7531707317073172}, 'support': {'supports': 2128, 'contradicts': 289, 'parts_of_same': 491}, 'micro_avg': {'precision': 0.8624484181568088, 'recall': 0.8624484181568088, 'f1': 0.8624484181568088, 'support': None}, 'macro_avg': {'precision': 0.7802049918659467, 'recall': 0.7718671674782415, 'f1': 0.7746806373017378, 'support': None}, 'weighted_avg': {'precision': 0.862716991440157, 'recall': 0.8624484181568088, 'f1': 0.8620842994217214, 'support': None}}
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8231e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2856e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9163e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5470e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8399e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7969e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7266e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8851e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8927e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5697e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7792e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2542e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9063e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4498e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6357e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0470e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5121e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5721e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3995e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3357e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5129e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8189e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3432e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1134e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7474e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4953e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1863e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7185e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9746e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3368e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0595e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5372e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7715e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5924e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2598e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0379e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3412e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9554e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0637e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5088e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8854e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3598e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2165e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6966e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6163e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9304e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2942e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3741e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0258e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6233e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4860e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2776e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4392e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9578e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0295e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5670e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7145e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3827e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8015e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2507e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9035e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3311e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4673e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0108e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8017e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1871e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5670e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9735e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5885e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3445e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6134e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2236e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5891e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9675e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6496e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1423e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5384e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3602e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9421e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2019e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2973e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8851e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5048e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3849e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7191e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2394e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6538e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8514e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8220e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4779e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4721e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5229e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1410e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3200e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4626e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4586e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2198e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8547e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5361e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1681e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2249e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3533e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3430e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5342e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2432e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2165e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7273e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4728e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6792e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7578e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9194e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3264e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9366e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8331e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4792e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2079e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5381e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8593e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6368e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6602e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8995e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5156e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6313e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7628e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5518e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1871e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5896e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2847e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0673e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4880e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6801e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0646e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3050e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9500e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0108e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0145e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3432e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7315e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0637e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6176e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3909e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6776e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6701e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7355e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3794e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9586e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9026e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7262e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1013e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5704e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0127e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5893e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5397e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3432e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5123e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2132e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1478e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6489e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5310e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9121e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2931e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4708e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3975e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2631e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7304e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1856e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0015e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4935e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3353e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1579e-06, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 23---------------
Evaluating
				 {'precision': {'supports': 0.9174138744690892, 'contradicts': 0.7035573122529645, 'parts_of_same': 0.7220149253731343}, 'recall': {'supports': 0.9135338345864662, 'contradicts': 0.615916955017301, 'parts_of_same': 0.7881873727087576}, 'f1': {'supports': 0.9154697433482459, 'contradicts': 0.6568265682656828, 'parts_of_same': 0.7536514118792599}, 'support': {'supports': 2128, 'contradicts': 289, 'parts_of_same': 491}, 'micro_avg': {'precision': 0.8627922971114168, 'recall': 0.8627922971114168, 'f1': 0.8627922971114168, 'support': None}, 'macro_avg': {'precision': 0.780995370698396, 'recall': 0.772546054104175, 'f1': 0.7753159078310627, 'support': None}, 'weighted_avg': {'precision': 0.8631685407391805, 'recall': 0.8627922971114168, 'f1': 0.8624433752773613, 'support': None}}
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2483e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8955e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9827e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3534e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1401e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3041e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6723e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4158e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6052e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9531e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4331e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8024e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9746e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6147e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7132e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2990e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8538e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6951e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1913e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2421e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8443e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4633e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4357e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7266e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2763e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8988e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9022e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0074e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0242e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9470e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9920e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6059e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0719e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4439e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5918e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7227e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9425e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3004e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6816e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0465e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1059e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1099e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3858e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3425e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9565e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1454e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9578e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3653e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3171e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9953e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5805e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8505e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2721e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5772e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0030e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5684e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6657e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5809e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4207e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4470e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5039e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4507e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8105e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7474e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7794e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9370e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3006e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7108e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4726e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0028e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7743e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0496e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8218e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4224e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8286e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6346e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3772e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8127e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6955e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0781e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1145e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5690e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5269e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1940e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3697e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5887e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5851e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5770e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9681e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3565e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4723e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8646e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8130e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8878e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0818e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6589e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4730e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6916e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3050e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9125e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0483e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2406e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6108e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9225e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0851e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1551e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2776e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1470e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0094e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1507e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7145e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9231e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7858e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2529e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5388e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8129e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7401e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0949e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7072e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6589e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0108e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5035e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1220e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0289e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7942e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1818e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3962e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8392e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6990e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5527e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5503e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7405e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8849e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2595e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0655e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2750e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3492e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3366e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8646e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5690e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1774e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8761e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1218e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9203e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0417e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2754e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9295e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9646e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5966e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1953e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2052e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6951e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2194e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7388e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3275e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2889e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0666e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8688e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2227e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5547e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9035e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7969e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9735e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3198e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6052e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2474e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5604e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5832e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3238e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2768e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4311e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4262e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7500e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8472e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8556e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7516e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4498e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0999e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7990e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5289e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6114e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8891e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1441e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3319e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9123e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1514e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5865e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9441e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9953e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8205e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4624e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7319e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4249e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5061e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9048e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7949e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8664e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6161e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9384e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7253e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1816e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2759e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9913e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5342e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6249e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8418e-06, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 24---------------
Evaluating
				 {'precision': {'supports': 0.9173748819641171, 'contradicts': 0.7035573122529645, 'parts_of_same': 0.7206703910614525}, 'recall': {'supports': 0.9130639097744361, 'contradicts': 0.615916955017301, 'parts_of_same': 0.7881873727087576}, 'f1': {'supports': 0.9152143193593971, 'contradicts': 0.6568265682656828, 'parts_of_same': 0.7529182879377432}, 'support': {'supports': 2128, 'contradicts': 289, 'parts_of_same': 491}, 'micro_avg': {'precision': 0.8624484181568088, 'recall': 0.8624484181568088, 'f1': 0.8624484181568088, 'support': None}, 'macro_avg': {'precision': 0.7805341950928447, 'recall': 0.7723894125001648, 'f1': 0.7749863918542744, 'support': None}, 'weighted_avg': {'precision': 0.8629129897083635, 'recall': 0.8624484181568088, 'f1': 0.8621326785429887, 'support': None}}
Loss: tensor(6.3268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4721e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5953e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0580e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1551e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9421e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1324e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4699e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2556e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6176e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0966e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7805e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4258e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9507e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0302e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3257e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2088e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2735e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2507e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2944e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6384e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7319e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0220e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5878e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0571e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6573e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7924e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3074e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7856e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7628e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4686e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8129e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4573e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7043e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3412e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0988e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2911e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3158e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7445e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7969e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2143e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7381e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7935e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7809e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5154e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1924e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0651e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3125e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8465e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3862e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0423e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7470e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9434e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1461e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7969e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5847e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3445e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8070e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9531e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7715e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2324e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1913e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9927e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9827e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2730e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8854e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7211e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6401e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4467e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4035e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5430e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4271e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2677e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1320e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3545e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4586e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4529e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3827e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5483e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9035e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3975e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3070e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3253e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5116e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5342e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9827e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5423e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2417e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8286e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4143e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8399e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1681e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3251e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5684e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3593e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5161e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1147e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4331e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0108e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5478e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1549e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2088e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4889e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0101e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3908e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1269e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3311e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4244e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9529e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1333e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8079e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4176e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3600e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7266e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6500e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7527e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9441e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0445e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4765e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0288e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6882e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4898e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5251e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3207e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8331e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3063e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7962e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7949e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3505e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8664e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7447e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6918e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4353e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6328e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3478e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3492e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7063e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5070e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1503e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5342e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9257e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3057e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9372e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3673e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8006e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0074e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3116e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1447e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4366e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1997e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0556e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6315e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7633e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2946e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0483e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8898e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6114e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4498e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4898e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8352e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9540e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0863e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8895e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2505e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0966e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8203e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5357e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1006e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9008e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1686e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0423e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9969e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6895e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2392e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2953e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8167e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3726e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1099e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2136e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2708e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2602e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3759e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3412e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5697e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9000e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8205e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2333e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7050e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8284e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9913e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4180e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5556e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1152e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8697e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9927e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8772e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4776e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0094e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5845e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9893e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9940e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9035e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0198e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8664e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8765e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4419e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5503e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7447e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0818e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1977e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8854e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3264e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0158e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2721e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8379e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8648e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2882e-06, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 25---------------
Evaluating
				 {'precision': {'supports': 0.9173748819641171, 'contradicts': 0.7035573122529645, 'parts_of_same': 0.7206703910614525}, 'recall': {'supports': 0.9130639097744361, 'contradicts': 0.615916955017301, 'parts_of_same': 0.7881873727087576}, 'f1': {'supports': 0.9152143193593971, 'contradicts': 0.6568265682656828, 'parts_of_same': 0.7529182879377432}, 'support': {'supports': 2128, 'contradicts': 289, 'parts_of_same': 491}, 'micro_avg': {'precision': 0.8624484181568088, 'recall': 0.8624484181568088, 'f1': 0.8624484181568088, 'support': None}, 'macro_avg': {'precision': 0.7805341950928447, 'recall': 0.7723894125001648, 'f1': 0.7749863918542744, 'support': None}, 'weighted_avg': {'precision': 0.8629129897083635, 'recall': 0.8624484181568088, 'f1': 0.8621326785429887, 'support': None}}
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1887e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4602e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4498e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0737e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9015e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6310e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6476e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9880e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7684e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1803e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3719e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8414e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0257e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5999e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6361e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4946e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0114e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2549e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4324e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7220e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3551e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5591e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3896e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1977e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5918e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3278e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8004e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0869e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8465e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5642e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8218e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0167e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8726e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9565e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0600e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3916e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4172e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9759e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3622e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5024e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4357e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4392e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2723e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4973e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1876e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7516e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2708e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2695e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1767e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4909e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4664e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1114e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1580e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0785e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4346e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0220e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5887e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2598e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6178e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1260e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1889e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0785e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8807e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3565e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2152e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5489e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4805e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6295e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9721e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5779e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0693e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9207e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6589e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3570e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1509e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7353e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3472e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7190e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2684e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0858e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1282e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2776e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0423e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9441e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5238e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5251e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8046e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3900e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2099e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5229e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5275e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5668e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2902e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3942e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1143e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2094e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5141e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6105e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8922e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9712e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7249e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7244e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1008e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3352e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7375e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9754e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5257e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3459e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1509e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0715e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2414e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7549e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0900e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7600e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0423e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6514e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8421e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5380e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9699e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2860e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4527e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7478e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3421e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5695e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2114e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7957e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4266e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7068e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2708e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2688e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5885e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4598e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7401e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8403e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8913e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6066e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1816e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6156e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3375e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3927e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9013e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6024e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4238e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9008e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2156e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3949e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1622e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9108e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6863e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2205e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4203e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8399e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0527e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0637e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9902e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9551e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3116e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9712e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2600e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0796e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4573e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5699e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5809e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7088e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3297e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8714e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0015e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5801e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0143e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2962e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2178e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8061e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9772e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4801e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9887e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8891e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0094e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8988e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2039e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9699e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5697e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5719e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2876e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0785e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3050e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7754e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4969e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3134e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7911e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4746e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3487e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3487e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2695e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5807e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1529e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7200e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9512e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1686e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2695e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1825e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2189e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8352e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6066e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0094e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4112e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0723e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5161e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1189e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0547e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2977e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4057e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1167e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2419e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6668e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7962e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8637e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0589e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4088e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8646e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2944e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8895e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2006e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9721e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2152e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9646e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0551e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3269e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1180e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4995e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4505e-06, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 26---------------
Evaluating
				 {'precision': {'supports': 0.9169419537517697, 'contradicts': 0.7023809523809523, 'parts_of_same': 0.7206703910614525}, 'recall': {'supports': 0.9130639097744361, 'contradicts': 0.6124567474048442, 'parts_of_same': 0.7881873727087576}, 'f1': {'supports': 0.9149988226983753, 'contradicts': 0.654343807763401, 'parts_of_same': 0.7529182879377432}, 'support': {'supports': 2128, 'contradicts': 289, 'parts_of_same': 491}, 'micro_avg': {'precision': 0.8621045392022009, 'recall': 0.8621045392022009, 'f1': 0.862104539202201, 'support': None}, 'macro_avg': {'precision': 0.7799977657313916, 'recall': 0.7712360099626793, 'f1': 0.7740869727998398, 'support': None}, 'weighted_avg': {'precision': 0.8624792760773845, 'recall': 0.8621045392022009, 'f1': 0.8617282443339744, 'support': None}}
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0242e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4573e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5704e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1145e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7207e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4505e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8997e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4686e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8854e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5342e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2951e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4935e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5041e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1635e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5410e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5768e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5999e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9653e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2275e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4677e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5642e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9388e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4898e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7617e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8693e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9913e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8445e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6946e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2695e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8328e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2225e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5061e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3116e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5229e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5878e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6412e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5966e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5125e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7399e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2017e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9044e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0346e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6156e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9243e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5380e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4889e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5380e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5525e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1324e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4519e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9485e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7257e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4030e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3088e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0262e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2554e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1809e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9008e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9838e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8827e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9940e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0242e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0918e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6496e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0818e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2708e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6048e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9406e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5767e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5251e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4518e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4721e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0785e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3677e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1152e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0355e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7668e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3441e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1143e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9478e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6066e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1461e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1008e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5999e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2094e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7655e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7628e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5803e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0737e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3116e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4430e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5542e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8719e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9114e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4355e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1487e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1353e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5640e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5154e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4030e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8693e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7549e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1695e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5070e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6489e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9551e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4059e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2006e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7010e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1644e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5441e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1461e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6953e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4714e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9452e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9203e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6384e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0779e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7190e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2085e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3858e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5222e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1328e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7922e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6723e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7368e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7792e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2333e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8518e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0288e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6328e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5767e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7754e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5253e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4628e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5057e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0962e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2278e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0375e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6500e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7628e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3057e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8895e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1622e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5534e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3132e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5310e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2695e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6310e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4229e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7865e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9865e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7688e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2152e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7949e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0445e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1997e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9238e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8904e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8284e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5999e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3231e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3189e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2876e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2776e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5061e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6465e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2876e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8520e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3512e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6180e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2542e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6527e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7617e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2695e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2333e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8832e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6315e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2990e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2514e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4573e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1529e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2333e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6417e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9913e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2410e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3909e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7885e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4417e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6203e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5885e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6946e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1324e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3882e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5127e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4143e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2946e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8772e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0074e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9397e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2384e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7516e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8827e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0242e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4735e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0627e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2962e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9805e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5297e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2152e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8580e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2927e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2333e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2527e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5328e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7266e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6746e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3229e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1320e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0845e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1918e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2450e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6862e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0028e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3278e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9392e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6741e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8816e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1220e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8512e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1461e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9313e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4030e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3047e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3419e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5161e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5242e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4063e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4735e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5284e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6871e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2695e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2571e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6476e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5953e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9189e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8139e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0496e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8761e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2545e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6858e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2098e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1099e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0275e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9969e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5946e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3635e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9000e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2695e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4070e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2437e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3375e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6180e-06, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 27---------------
Evaluating
				 {'precision': {'supports': 0.9169419537517697, 'contradicts': 0.701195219123506, 'parts_of_same': 0.7193308550185874}, 'recall': {'supports': 0.9130639097744361, 'contradicts': 0.6089965397923875, 'parts_of_same': 0.7881873727087576}, 'f1': {'supports': 0.9149988226983753, 'contradicts': 0.6518518518518518, 'parts_of_same': 0.7521865889212828}, 'support': {'supports': 2128, 'contradicts': 289, 'parts_of_same': 491}, 'micro_avg': {'precision': 0.8617606602475929, 'recall': 0.8617606602475929, 'f1': 0.8617606602475929, 'support': None}, 'macro_avg': {'precision': 0.7791560092979544, 'recall': 0.7700826074251937, 'f1': 0.77301242115717, 'support': None}, 'weighted_avg': {'precision': 0.8621352633165699, 'recall': 0.8617606602475929, 'f1': 0.86135704781557, 'support': None}}
Loss: tensor(2.5395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9509e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0651e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1315e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7697e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4324e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2977e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6951e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2375e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8465e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1237e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6572e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5405e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1931e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2278e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4229e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0236e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8714e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5825e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3631e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1450e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3450e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1796e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4366e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6328e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0737e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5302e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7368e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6723e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9169e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4944e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3013e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6134e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4946e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5380e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4781e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9893e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1984e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1622e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8139e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2977e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5785e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5535e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3421e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4935e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0644e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6491e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1253e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7044e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7190e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7587e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9838e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6165e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1434e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6203e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3668e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3781e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5380e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2664e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9224e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5167e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0443e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9950e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6770e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3088e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5684e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8904e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4229e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9913e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1542e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3781e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2186e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0262e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1576e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8648e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8662e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3264e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3794e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0898e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0094e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8646e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6951e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5441e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1260e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5297e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1803e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9225e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2977e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6904e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1123e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5999e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8988e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3918e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5622e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9997e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4244e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6203e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5807e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5380e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5586e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4143e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9712e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8310e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6907e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6595e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8139e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3297e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8465e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2953e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1461e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0785e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7768e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9189e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1050e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4882e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0624e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6542e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8399e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7094e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8714e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2514e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4644e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1322e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4746e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1984e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9735e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0423e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8013e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2876e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9000e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9950e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7924e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3681e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1273e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8048e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0708e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1648e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4236e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8533e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3143e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3962e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6825e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3805e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5489e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3191e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0556e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9856e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7414e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3600e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5079e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6852e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7405e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3035e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1010e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3774e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4247e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5127e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6328e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1803e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0962e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4505e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3419e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3269e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7043e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5308e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3231e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2434e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8637e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9257e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3708e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9759e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0242e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0288e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4772e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3231e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9540e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2514e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8478e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9902e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6180e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5977e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7880e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6653e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4699e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8130e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2165e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1760e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3880e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6417e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0310e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9766e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0061e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6880e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0966e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1099e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6361e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7190e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1768e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7955e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2889e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2098e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2545e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2525e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7730e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4324e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1984e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6145e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1079e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3862e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8935e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7024e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7035e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8408e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3158e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9940e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6310e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3125e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6167e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6333e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3668e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6410e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9893e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6862e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1286e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1454e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7904e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0439e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2121e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6827e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5984e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6231e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3781e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9243e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5818e-06, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 28---------------
Evaluating
				 {'precision': {'supports': 0.9165487977369166, 'contradicts': 0.7028112449799196, 'parts_of_same': 0.7193308550185874}, 'recall': {'supports': 0.9135338345864662, 'contradicts': 0.6055363321799307, 'parts_of_same': 0.7881873727087576}, 'f1': {'supports': 0.9150388326665098, 'contradicts': 0.6505576208178437, 'parts_of_same': 0.7521865889212828}, 'support': {'supports': 2128, 'contradicts': 289, 'parts_of_same': 491}, 'micro_avg': {'precision': 0.8617606602475929, 'recall': 0.8617606602475929, 'f1': 0.8617606602475929, 'support': None}, 'macro_avg': {'precision': 0.7795636325784745, 'recall': 0.7690858464917181, 'f1': 0.7725943474685454, 'support': None}, 'weighted_avg': {'precision': 0.8620081640981712, 'recall': 0.8617606602475929, 'f1': 0.8612577040890781, 'support': None}}
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8646e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2152e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4417e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2709e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5955e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3600e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2565e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9000e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3631e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2098e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1911e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7447e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3185e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0962e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7809e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1891e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2039e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5719e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7088e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1169e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9699e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4244e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1074e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2545e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8566e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3812e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6227e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7282e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7289e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0918e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4024e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7074e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4880e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1092e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3269e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4598e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0604e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3269e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6180e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2664e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8478e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8662e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6852e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1074e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3278e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9950e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1648e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2916e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0399e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6496e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2505e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2827e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6951e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0966e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5768e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0192e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4324e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5719e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3047e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6039e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4324e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6852e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2072e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7132e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4765e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0785e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6496e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6723e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5801e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4229e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2514e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4519e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8255e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5999e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4244e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8447e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4178e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5209e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2944e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2108e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9950e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0918e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9123e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7094e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4403e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0805e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3450e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6408e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3105e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1760e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4357e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7856e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1461e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3996e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4900e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0556e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5776e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6774e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0854e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2072e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1099e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3996e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0715e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2105e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5154e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5405e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3319e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4858e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4554e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1260e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9869e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2152e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3492e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4392e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8491e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1529e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4143e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2737e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4366e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2165e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8308e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8662e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2695e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1350e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0399e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6825e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9721e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8891e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0375e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3781e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5719e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9916e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7190e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0899e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3996e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4518e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6049e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0048e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6904e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8139e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1434e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1531e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7024e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2507e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2882e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5127e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5441e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5266e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9699e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5640e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5865e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7345e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7266e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8997e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2688e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3554e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6055e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3278e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0664e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7907e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1141e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1099e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1668e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2207e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0057e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3668e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1434e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1079e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3996e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0375e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8125e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9088e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6319e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3269e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9427e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3116e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1622e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8465e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3545e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1675e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1099e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1074e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8368e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4247e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9950e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1480e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8436e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8445e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4519e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2775e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8491e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9465e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8139e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8960e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0262e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4335e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3487e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5878e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0218e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7617e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8904e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0918e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0218e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5999e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9189e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7392e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0556e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9946e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9427e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3996e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5061e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2688e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5807e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3269e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6329e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5410e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6572e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2525e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2186e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1099e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0470e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8817e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7529e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3357e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4762e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2977e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5591e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8626e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1622e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2709e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9853e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8447e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5380e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2796e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1760e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2410e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8273e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4439e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7190e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5284e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5719e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3386e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8310e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2545e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5885e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2951e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0688e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6329e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4055e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0192e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5236e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8483e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4860e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6483e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0542e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1914e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5079e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1759e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4247e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6329e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2935e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8838e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7741e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5818e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8445e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5380e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6852e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4858e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4960e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3887e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3057e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4505e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0536e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2253e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2186e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7955e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1803e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8198e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2695e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1099e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2186e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5229e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8366e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7617e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0805e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7094e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0918e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0048e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6668e-07, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 29---------------
Evaluating
				 {'precision': {'supports': 0.9165487977369166, 'contradicts': 0.7028112449799196, 'parts_of_same': 0.7193308550185874}, 'recall': {'supports': 0.9135338345864662, 'contradicts': 0.6055363321799307, 'parts_of_same': 0.7881873727087576}, 'f1': {'supports': 0.9150388326665098, 'contradicts': 0.6505576208178437, 'parts_of_same': 0.7521865889212828}, 'support': {'supports': 2128, 'contradicts': 289, 'parts_of_same': 491}, 'micro_avg': {'precision': 0.8617606602475929, 'recall': 0.8617606602475929, 'f1': 0.8617606602475929, 'support': None}, 'macro_avg': {'precision': 0.7795636325784745, 'recall': 0.7690858464917181, 'f1': 0.7725943474685454, 'support': None}, 'weighted_avg': {'precision': 0.8620081640981712, 'recall': 0.8617606602475929, 'f1': 0.8612577040890781, 'support': None}}
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2525e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0262e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0194e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8352e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8273e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1664e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7631e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5977e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1342e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0924e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0737e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8436e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4238e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0637e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5704e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2545e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5807e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4328e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2951e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2233e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1461e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5116e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2525e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5809e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0999e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2152e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8518e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9169e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8352e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4699e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4973e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7867e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8136e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1760e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3900e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0715e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0061e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9699e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2709e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0375e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2688e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5432e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3357e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0580e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2709e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7345e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8646e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5380e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8478e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9558e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1664e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1803e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0622e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1350e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9189e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4762e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9032e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5999e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5459e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0262e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8816e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4242e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7006e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2545e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9427e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7529e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2730e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7066e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5141e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1141e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6572e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3593e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5041e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0556e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8895e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3996e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0818e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1237e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7754e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5196e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5885e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1237e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3896e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4858e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5284e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1099e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6690e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9406e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6129e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4180e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0624e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1664e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5955e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0737e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9856e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2951e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8294e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4239e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7433e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3474e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9856e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9699e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5807e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9950e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3570e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5229e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2186e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8331e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0037e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3194e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1216e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0619e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5999e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7549e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6136e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0965e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6536e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2152e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8646e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6066e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1425e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3410e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8662e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8485e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7617e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0375e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8139e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7902e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6582e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3269e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6057e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0624e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1760e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4703e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2437e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1891e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2935e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8566e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9950e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7617e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4640e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7345e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7094e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1421e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9950e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0619e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0288e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1237e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9678e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9853e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8472e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3419e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2191e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3640e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2876e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3975e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5269e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7251e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7617e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6180e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3525e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7225e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3231e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5516e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7578e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4916e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7617e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3176e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0737e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5041e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8807e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1467e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3047e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1237e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7765e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4417e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4238e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7216e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2951e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2525e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7540e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6329e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2333e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7617e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7433e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7730e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5807e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6329e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2432e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0414e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1237e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0192e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6668e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6852e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1348e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6055e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3050e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0627e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0008e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5141e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5425e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6668e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0918e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5224e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9856e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3269e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9243e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2152e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0681e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4953e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0619e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5284e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2437e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7216e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6015e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8264e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2913e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4055e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4355e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1622e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2165e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3996e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2253e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0624e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7922e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0037e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2010e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0218e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8653e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1664e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4156e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3492e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8139e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6329e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8103e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9155e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6525e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5388e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4519e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2709e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1053e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0898e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5041e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6129e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3812e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6735e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4765e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0898e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3141e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5308e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2709e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8904e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5975e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7006e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0924e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5623e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5807e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9019e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3781e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1105e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6527e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2002e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5161e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7763e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9675e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5224e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4392e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6852e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4703e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7754e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2957e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4180e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9008e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3570e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3570e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7190e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2010e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5489e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7006e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2525e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8845e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8714e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8436e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8825e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3079e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2573e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4319e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9427e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2186e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0580e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8721e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3474e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4586e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0302e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9088e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5637e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3474e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7622e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4858e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3849e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5704e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7211e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3419e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0461e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7893e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7924e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8646e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0715e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9313e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0038e-06, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 30---------------
Evaluating
				 {'precision': {'supports': 0.9165487977369166, 'contradicts': 0.7028112449799196, 'parts_of_same': 0.7193308550185874}, 'recall': {'supports': 0.9135338345864662, 'contradicts': 0.6055363321799307, 'parts_of_same': 0.7881873727087576}, 'f1': {'supports': 0.9150388326665098, 'contradicts': 0.6505576208178437, 'parts_of_same': 0.7521865889212828}, 'support': {'supports': 2128, 'contradicts': 289, 'parts_of_same': 491}, 'micro_avg': {'precision': 0.8617606602475929, 'recall': 0.8617606602475929, 'f1': 0.8617606602475929, 'support': None}, 'macro_avg': {'precision': 0.7795636325784745, 'recall': 0.7690858464917181, 'f1': 0.7725943474685454, 'support': None}, 'weighted_avg': {'precision': 0.8620081640981712, 'recall': 0.8617606602475929, 'f1': 0.8612577040890781, 'support': None}}
Loss: tensor(5.8382e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6863e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6057e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7094e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9950e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3812e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5242e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5706e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0899e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7767e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5380e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3057e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6565e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2052e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6399e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6668e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3474e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8904e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8478e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5623e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5807e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8518e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0898e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2421e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1421e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8103e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6852e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1461e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2525e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7955e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5999e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8465e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4858e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8721e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4765e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8662e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4222e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6333e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8662e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6558e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6904e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6542e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8445e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3231e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3474e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5591e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8255e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5380e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6542e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4403e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7190e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6644e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2907e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9853e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8904e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8103e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2328e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8668e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8101e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0104e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8139e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6472e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7617e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4573e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5478e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0580e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0899e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8478e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6180e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0288e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2002e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8074e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2098e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3290e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4598e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6653e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8273e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4858e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5342e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8895e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5161e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2951e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9000e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5807e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2776e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6572e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2445e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8436e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5209e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1480e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3386e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5070e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4519e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5331e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1304e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9675e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2951e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6203e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1099e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9675e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1487e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8518e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0399e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3996e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7617e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0194e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4519e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6357e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8478e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9675e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1781e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0443e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5284e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4686e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6329e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2951e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2951e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0375e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5196e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9611e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5807e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0648e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7540e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7447e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7617e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9595e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3908e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9313e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3701e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9427e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1467e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0375e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5041e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4519e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0580e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2709e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2821e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1648e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4519e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2746e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4417e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8662e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1169e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4946e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1141e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6904e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0104e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8662e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7521e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0898e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5052e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9678e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6781e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8646e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4674e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2767e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9339e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4765e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1699e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8807e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1237e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2421e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4403e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5955e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0399e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5955e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6295e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2688e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7631e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5127e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9243e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7955e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1053e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2951e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0924e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6180e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1803e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1141e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8662e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0624e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9675e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6644e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4762e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0924e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1079e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0030e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4143e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2437e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4519e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7955e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5342e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2695e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2951e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5308e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4754e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9331e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1286e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1631e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1066e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4403e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2186e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8478e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5308e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9611e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1105e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7885e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7094e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7518e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6484e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8904e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4762e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8653e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3474e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0924e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1141e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4858e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9675e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2002e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0194e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0619e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0715e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9670e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0715e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9853e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8817e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9853e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0194e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8662e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5041e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3474e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3269e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6910e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6904e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9243e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1237e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6673e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3996e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5538e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4880e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8721e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2043e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1304e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1467e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9313e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9712e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6852e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8904e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4703e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9088e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0642e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9950e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6572e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5041e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7940e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3570e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0761e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1450e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2010e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6910e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5041e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6910e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6763e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0288e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2341e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6542e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5052e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0289e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6049e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3474e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3057e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6572e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9766e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6046e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5478e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6825e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6057e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2002e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0218e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2709e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4924e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0194e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3726e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8904e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3047e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7617e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1066e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8904e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0957e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0743e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9675e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0218e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0376e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7966e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9670e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4821e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0192e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3996e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6484e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0580e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7178e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4699e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2525e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6558e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6904e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6910e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6852e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8662e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4328e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1906e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3774e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6572e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2341e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0899e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8382e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4151e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1141e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9427e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1141e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4674e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7529e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7859e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5390e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3996e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0556e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4598e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9132e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1664e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1297e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3231e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3812e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9678e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7741e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9853e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8566e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6880e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7859e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3492e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6852e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9950e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9853e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7190e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1914e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7712e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2429e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1141e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9670e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6572e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3600e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9950e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0580e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2421e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0619e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9088e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6361e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1664e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1891e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2346e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8825e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5953e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9611e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6910e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5796e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8039e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3474e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6910e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3996e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0037e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2043e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)


		-------------RUN 3-----------
			------------EPOCH 1---------------
Evaluating
				 {'precision': {'supports': 0.7309885931558935, 'contradicts': 0.3333333333333333, 'parts_of_same': 0.2}, 'recall': {'supports': 0.9974059662775616, 'contradicts': 0.003215434083601286, 'parts_of_same': 0.001851851851851852}, 'f1': {'supports': 0.8436642896324739, 'contradicts': 0.006369426751592356, 'parts_of_same': 0.003669724770642202}, 'support': {'supports': 2313, 'contradicts': 311, 'parts_of_same': 540}, 'micro_avg': {'precision': 0.7297724399494311, 'recall': 0.7297724399494311, 'f1': 0.7297724399494311, 'support': None}, 'macro_avg': {'precision': 0.4214406421630756, 'recall': 0.33415775073767157, 'f1': 0.28456781371823614, 'support': None}, 'weighted_avg': {'precision': 0.6012779022238459, 'recall': 0.7297724399494311, 'f1': 0.6180019105612529, 'support': None}}
Loss: tensor(2.6397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2849, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2952, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2853, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9959, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7990, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3927, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3873, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2758, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2997, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8846, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8963, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2931, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9963, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2910, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2885, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2803, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2887, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2940, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2720, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0960, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2849, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2815, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2849, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2852, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1737, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4979, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2906, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1835, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1995, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9793, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3955, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3965, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3979, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8794, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4742, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3919, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3972, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6747, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4819, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2808, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7947, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4637, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3990, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6660, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3846, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2955, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3848, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3912, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4992, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2716, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2777, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2914, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9720, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3805, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3782, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4941, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8944, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1885, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7867, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4789, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7720, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4840, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2957, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9787, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4919, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3969, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6835, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4881, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3679, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2945, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1873, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8982, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1957, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3957, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1873, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3741, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2762, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1900, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3837, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1862, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2693, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1752, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7994, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8676, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1918, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1806, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1679, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2737, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3889, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2803, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2947, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0733, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3824, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8943, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6979, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8794, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2957, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2930, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3879, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4948, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4796, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3837, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2733, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9979, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4885, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4980, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4846, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3772, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6990, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1933, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2857, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1741, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2833, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4772, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0994, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5873, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4991, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0767, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6998, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0990, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4820, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1937, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1862, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1924, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3815, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3720, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0896, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2736, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0819, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1800, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4784, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0939, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1940, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0879, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4803, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4862, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4848, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2853, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1934, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4638, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3762, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1866, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0796, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3915, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9835, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1787, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2906, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7989, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0957, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3805, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9883, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1716, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4955, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3874, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7959, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2716, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4890, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4733, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6971, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3908, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1941, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3903, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8931, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4819, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0925, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0897, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6866, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1820, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1874, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2889, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1909, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3975, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3926, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3877, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0886, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4742, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1892, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3660, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2000, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3881, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6921, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6801, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6764, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0782, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3848, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3747, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9954, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0867, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5963, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2969, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2796, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1000, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3824, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4801, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0930, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2008, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 2---------------
Evaluating
				 {'precision': {'supports': 0.9912109375, 'contradicts': 0.24953789279112754, 'parts_of_same': 0.44801512287334594}, 'recall': {'supports': 0.4388240380458279, 'contradicts': 0.8681672025723473, 'parts_of_same': 0.8777777777777778}, 'f1': {'supports': 0.6083308360803117, 'contradicts': 0.38765254845656855, 'parts_of_same': 0.5932415519399249}, 'support': {'supports': 2313, 'contradicts': 311, 'parts_of_same': 540}, 'micro_avg': {'precision': 0.5559418457648546, 'recall': 0.5559418457648546, 'f1': 0.5559418457648546, 'support': None}, 'macro_avg': {'precision': 0.5629213177214912, 'recall': 0.7282563394653176, 'f1': 0.5297416454922684, 'support': None}, 'weighted_avg': {'precision': 0.825602196411867, 'recall': 0.5559418457648546, 'f1': 0.5840643503385946, 'support': None}}
Loss: tensor(0.4513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0801, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0960, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2988, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2762, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2944, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6881, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3752, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2987, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2837, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3891, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4962, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2955, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3903, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6955, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1777, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2737, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4846, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4730, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4976, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0870, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3937, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8959, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1997, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0967, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1875, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3720, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2955, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3980, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1943, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6931, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4806, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0693, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1968, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7803, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4870, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0963, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6916, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7800, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6941, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1917, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0758, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3941, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1946, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2771, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2954, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2751, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2903, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2969, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0752, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1937, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6925, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0817, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7963, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1954, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6918, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0916, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0891, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1935, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6952, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2987, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0941, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1739, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3976, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0764, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1883, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1968, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7955, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0959, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3912, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0998, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0927, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1720, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1737, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4934, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0920, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1916, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8803, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3956, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5928, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0000, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4994, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8980, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2990, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0976, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0887, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2940, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0990, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2638, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0994, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1987, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2796, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1848, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0986, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2737, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5820, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1862, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0815, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1886, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0925, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1919, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0733, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0904, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4931, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0885, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1878, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2846, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1808, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6736, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2866, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3903, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0888, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2967, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0958, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0777, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3980, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0883, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4967, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6911, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0992, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0900, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3793, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2997, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1942, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2965, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0934, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2915, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0870, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2941, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5952, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5993, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8801, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5941, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4938, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1889, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1764, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1821, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1877, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1985, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8989, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1985, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1771, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9973, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5953, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0805, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0787, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0777, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0897, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1742, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0943, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2991, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0764, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4716, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2892, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0849, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5945, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1660, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2957, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1897, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0956, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1961, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1762, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1989, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0852, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0979, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1782, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0998, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0752, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1784, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7999, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3990, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3000, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1803, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0910, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5939, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2690, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0840, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1840, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0787, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4973, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0767, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1937, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0879, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0894, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 3---------------
Evaluating
				 {'precision': {'supports': 0.8844884488448845, 'contradicts': 0.645933014354067, 'parts_of_same': 0.7570621468926554}, 'recall': {'supports': 0.9269347168179853, 'contradicts': 0.4340836012861736, 'parts_of_same': 0.7444444444444445}, 'f1': {'supports': 0.9052142706354234, 'contradicts': 0.5192307692307693, 'parts_of_same': 0.7507002801120449}, 'support': {'supports': 2313, 'contradicts': 311, 'parts_of_same': 540}, 'micro_avg': {'precision': 0.8473451327433629, 'recall': 0.8473451327433629, 'f1': 0.8473451327433629, 'support': None}, 'macro_avg': {'precision': 0.7624945366972024, 'recall': 0.7018209208495345, 'f1': 0.7250484399927458, 'support': None}, 'weighted_avg': {'precision': 0.8392921962592815, 'recall': 0.8473451327433629, 'f1': 0.840903770060369, 'support': None}}
Loss: tensor(0.0582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1000, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0914, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4949, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0909, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5988, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0866, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0693, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2875, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1852, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7690, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0803, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1878, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2916, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0693, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0762, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1980, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1935, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0849, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0919, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3801, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1794, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2679, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0789, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0947, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1897, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0687, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1945, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0819, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0782, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0994, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0857, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3924, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0939, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7800, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1870, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0660, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0690, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0909, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1817, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1747, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1891, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8835, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5968, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0862, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0944, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0889, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0860, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9914, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2920, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2923, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1963, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0793, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1849, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0914, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2739, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3848, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1758, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7808, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3985, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6817, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4997, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7990, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4881, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0771, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1947, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4988, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0923, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5693, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0991, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3952, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3637, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4771, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7988, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0834, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0720, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0833, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0885, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0913, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3742, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3777, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1772, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9875, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3808, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3936, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4840, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2782, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0993, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3751, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5771, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1891, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0963, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2924, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1975, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0660, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0857, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0945, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2993, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1762, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1946, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0916, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0939, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1997, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3762, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1860, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3990, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7943, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2954, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1980, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0981, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0925, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0817, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0853, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3820, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0840, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0943, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1867, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0998, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1857, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1937, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0931, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0372, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 4---------------
Evaluating
				 {'precision': {'supports': 0.8974812196199735, 'contradicts': 0.5140449438202247, 'parts_of_same': 0.7339449541284404}, 'recall': {'supports': 0.8780804150453956, 'contradicts': 0.5884244372990354, 'parts_of_same': 0.7407407407407407}, 'f1': {'supports': 0.8876748251748252, 'contradicts': 0.5487256371814093, 'parts_of_same': 0.7373271889400922}, 'support': {'supports': 2313, 'contradicts': 311, 'parts_of_same': 540}, 'micro_avg': {'precision': 0.8261694058154235, 'recall': 0.8261694058154235, 'f1': 0.8261694058154235, 'support': None}, 'macro_avg': {'precision': 0.7151570391895462, 'recall': 0.7357485310283906, 'f1': 0.7245758837654422, 'support': None}, 'weighted_avg': {'precision': 0.831881262243504, 'recall': 0.8261694058154235, 'f1': 0.8286985543048163, 'support': None}}
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5830, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0962, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2939, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6975, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4866, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2972, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2877, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0758, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0987, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0794, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2852, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6918, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4846, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0957, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7762, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4937, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0967, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2736, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7938, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1997, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2923, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0739, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3920, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0917, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0805, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1996, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0919, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0877, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3789, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2898, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8870, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3837, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3952, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8926, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4860, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0886, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3891, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1912, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3863, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1926, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6818, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0972, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3849, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1919, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0793, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0815, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5961, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1944, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2862, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0956, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0914, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0638, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3730, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2955, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1946, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1716, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0801, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0925, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 5---------------
Evaluating
				 {'precision': {'supports': 0.9018053720827829, 'contradicts': 0.6351931330472103, 'parts_of_same': 0.6590909090909091}, 'recall': {'supports': 0.885430177258971, 'contradicts': 0.4758842443729904, 'parts_of_same': 0.8055555555555556}, 'f1': {'supports': 0.893542757417103, 'contradicts': 0.5441176470588235, 'parts_of_same': 0.7250000000000001}, 'support': {'supports': 2313, 'contradicts': 311, 'parts_of_same': 540}, 'micro_avg': {'precision': 0.8315423514538559, 'recall': 0.8315423514538559, 'f1': 0.8315423514538559, 'support': None}, 'macro_avg': {'precision': 0.7320298047403008, 'recall': 0.7222899923958389, 'f1': 0.7208868014919755, 'support': None}, 'weighted_avg': {'precision': 0.8341750887845292, 'recall': 0.8315423514538559, 'f1': 0.8304314115490056, 'support': None}}
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2993, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0835, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1944, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0917, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3863, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3837, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1846, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1936, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7931, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1935, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0896, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1784, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8852, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1863, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1968, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0936, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1821, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1995, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1687, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0896, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2943, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0916, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0878, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4986, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0733, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0742, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3821, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0782, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0886, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3875, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0862, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2840, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1918, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0946, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4897, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0885, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5948, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0830, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0693, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1960, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1857, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5867, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1771, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 6---------------
Evaluating
				 {'precision': {'supports': 0.9071395240317313, 'contradicts': 0.6036036036036037, 'parts_of_same': 0.55819774718398}, 'recall': {'supports': 0.8404669260700389, 'contradicts': 0.43086816720257237, 'parts_of_same': 0.825925925925926}, 'f1': {'supports': 0.8725314183123878, 'contradicts': 0.5028142589118199, 'parts_of_same': 0.6661687826736371}, 'support': {'supports': 2313, 'contradicts': 311, 'parts_of_same': 540}, 'micro_avg': {'precision': 0.797724399494311, 'recall': 0.797724399494311, 'f1': 0.797724399494311, 'support': None}, 'macro_avg': {'precision': 0.689646958273105, 'recall': 0.6990870063995125, 'f1': 0.6805048199659481, 'support': None}, 'weighted_avg': {'precision': 0.8177500705706272, 'recall': 0.797724399494311, 'f1': 0.8009707799373872, 'support': None}}
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1990, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0693, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0897, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0820, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1888, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0928, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1915, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0835, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0980, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0946, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0886, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0931, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0910, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0835, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0949, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0693, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0637, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0912, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2920, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1973, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0980, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0862, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1949, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0910, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0908, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0471, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 7---------------
Evaluating
				 {'precision': {'supports': 0.9052028218694885, 'contradicts': 0.5992063492063492, 'parts_of_same': 0.687888198757764}, 'recall': {'supports': 0.8875918720276696, 'contradicts': 0.4855305466237942, 'parts_of_same': 0.8203703703703704}, 'f1': {'supports': 0.8963108491595722, 'contradicts': 0.536412078152753, 'parts_of_same': 0.7483108108108107}, 'support': {'supports': 2313, 'contradicts': 311, 'parts_of_same': 540}, 'micro_avg': {'precision': 0.8365992414664981, 'recall': 0.8365992414664981, 'f1': 0.8365992414664981, 'support': None}, 'macro_avg': {'precision': 0.730765789944534, 'recall': 0.7311642630072782, 'f1': 0.7270112460410454, 'support': None}, 'weighted_avg': {'precision': 0.8380363239306239, 'recall': 0.8365992414664981, 'f1': 0.8356760392697328, 'support': None}}
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0687, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0835, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1956, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5835, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4926, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0955, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3866, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0951, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1693, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1937, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0919, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1803, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8741, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3835, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0988, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3863, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0946, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1801, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0764, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3716, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1637, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0887, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0934, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1914, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0839, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6961, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2908, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0987, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1716, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0931, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0848, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6986, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0918, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1334, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 8---------------
Evaluating
				 {'precision': {'supports': 0.9146110056925996, 'contradicts': 0.6558704453441295, 'parts_of_same': 0.5747836835599506}, 'recall': {'supports': 0.8335495028102032, 'contradicts': 0.5209003215434084, 'parts_of_same': 0.8611111111111112}, 'f1': {'supports': 0.872200859534042, 'contradicts': 0.5806451612903226, 'parts_of_same': 0.6893995552260935}, 'support': {'supports': 2313, 'contradicts': 311, 'parts_of_same': 540}, 'micro_avg': {'precision': 0.8075221238938053, 'recall': 0.8075221238938053, 'f1': 0.8075221238938053, 'support': None}, 'macro_avg': {'precision': 0.7150883781988933, 'recall': 0.7385203118215742, 'f1': 0.714081858683486, 'support': None}, 'weighted_avg': {'precision': 0.8311802003133314, 'recall': 0.8075221238938053, 'f1': 0.8123441823911568, 'support': None}}
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0958, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3866, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1733, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1751, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0995, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0794, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1638, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0943, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0866, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6921, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0958, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1985, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0835, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2985, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0951, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3846, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0948, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0888, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 9---------------
Evaluating
				 {'precision': {'supports': 0.898397976391231, 'contradicts': 0.6877828054298643, 'parts_of_same': 0.7408056042031523}, 'recall': {'supports': 0.9213143104193687, 'contradicts': 0.4887459807073955, 'parts_of_same': 0.7833333333333333}, 'f1': {'supports': 0.9097118463180363, 'contradicts': 0.5714285714285714, 'parts_of_same': 0.7614761476147615}, 'support': {'supports': 2313, 'contradicts': 311, 'parts_of_same': 540}, 'micro_avg': {'precision': 0.8552465233881164, 'recall': 0.8552465233881164, 'f1': 0.8552465233881164, 'support': None}, 'macro_avg': {'precision': 0.7756621286747492, 'recall': 0.7311312081533657, 'f1': 0.7475388551204564, 'support': None}, 'weighted_avg': {'precision': 0.8507996201489592, 'recall': 0.8552465233881164, 'f1': 0.8511614747028681, 'support': None}}
Loss: tensor(7.3138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1888, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0990, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0997, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1638, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1393e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 10---------------
Evaluating
				 {'precision': {'supports': 0.9070567986230637, 'contradicts': 0.6374045801526718, 'parts_of_same': 0.759515570934256}, 'recall': {'supports': 0.9113705144833549, 'contradicts': 0.5369774919614148, 'parts_of_same': 0.812962962962963}, 'f1': {'supports': 0.9092085400043131, 'contradicts': 0.5828970331588132, 'parts_of_same': 0.7853309481216458}, 'support': {'supports': 2313, 'contradicts': 311, 'parts_of_same': 540}, 'micro_avg': {'precision': 0.8577749683944375, 'recall': 0.8577749683944375, 'f1': 0.8577749683944375, 'support': None}, 'macro_avg': {'precision': 0.767992316569997, 'recall': 0.7537703231359109, 'f1': 0.759145507094924, 'support': None}, 'weighted_avg': {'precision': 0.855370925394161, 'recall': 0.8577749683944375, 'f1': 0.8559921119873753, 'support': None}}
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0874, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7885, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7987, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0959, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1690, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1945, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0998, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1951, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 11---------------
Evaluating
				 {'precision': {'supports': 0.9026431718061674, 'contradicts': 0.53315649867374, 'parts_of_same': 0.7717601547388782}, 'recall': {'supports': 0.8858625162127107, 'contradicts': 0.6463022508038585, 'parts_of_same': 0.7388888888888889}, 'f1': {'supports': 0.8941741217543094, 'contradicts': 0.5843023255813953, 'parts_of_same': 0.7549668874172185}, 'support': {'supports': 2313, 'contradicts': 311, 'parts_of_same': 540}, 'micro_avg': {'precision': 0.8372313527180784, 'recall': 0.8372313527180784, 'f1': 0.8372313527180784, 'support': None}, 'macro_avg': {'precision': 0.7358532750729285, 'recall': 0.7570178853018193, 'f1': 0.7444811115843076, 'support': None}, 'weighted_avg': {'precision': 0.8439872980512619, 'recall': 0.8372313527180784, 'f1': 0.8399572964850915, 'support': None}}
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0794, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0940, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3840, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1886, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0796, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7972, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0940, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0881, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6906, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0857, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1898, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0973, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4730, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0821, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0960, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0943, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 12---------------
Evaluating
				 {'precision': {'supports': 0.9117514633048176, 'contradicts': 0.647887323943662, 'parts_of_same': 0.6219178082191781}, 'recall': {'supports': 0.8754863813229572, 'contradicts': 0.4437299035369775, 'parts_of_same': 0.8407407407407408}, 'f1': {'supports': 0.8932509925011027, 'contradicts': 0.5267175572519084, 'parts_of_same': 0.7149606299212599}, 'support': {'supports': 2313, 'contradicts': 311, 'parts_of_same': 540}, 'micro_avg': {'precision': 0.827117572692794, 'recall': 0.827117572692794, 'f1': 0.827117572692794, 'support': None}, 'macro_avg': {'precision': 0.7271855318225526, 'recall': 0.7199856752002253, 'f1': 0.7116430598914235, 'support': None}, 'weighted_avg': {'precision': 0.8363494654895318, 'recall': 0.827117572692794, 'f1': 0.8267943887856746, 'support': None}}
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1874, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2938, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1824, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3920, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4716, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3752, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9867, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9860, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0840, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0736, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1920, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0940, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0817, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5989, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6979, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5915, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 13---------------
Evaluating
				 {'precision': {'supports': 0.889760348583878, 'contradicts': 0.6833333333333333, 'parts_of_same': 0.6114819759679573}, 'recall': {'supports': 0.8828361435365326, 'contradicts': 0.26366559485530544, 'parts_of_same': 0.8481481481481481}, 'f1': {'supports': 0.8862847222222222, 'contradicts': 0.38051044083526675, 'parts_of_same': 0.7106283941039565}, 'support': {'supports': 2313, 'contradicts': 311, 'parts_of_same': 540}, 'micro_avg': {'precision': 0.816055625790139, 'recall': 0.816055625790139, 'f1': 0.816055625790139, 'support': None}, 'macro_avg': {'precision': 0.7281918859617228, 'recall': 0.6648832955133287, 'f1': 0.6591411857204817, 'support': None}, 'weighted_avg': {'precision': 0.8219761757155101, 'recall': 0.816055625790139, 'f1': 0.8065912270593883, 'support': None}}
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0878, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4751, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1996, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0784, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0751, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1762, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0720, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7954, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5758, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2936, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3994, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1961, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0955, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8969, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0834, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0985, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1912, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1935, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2933, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1741, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2716, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4817, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1821, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3947, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0733, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1925, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3923, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0924, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1862, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 14---------------
Evaluating
				 {'precision': {'supports': 0.9045293072824157, 'contradicts': 0.5369774919614148, 'parts_of_same': 0.7121464226289518}, 'recall': {'supports': 0.880674448767834, 'contradicts': 0.5369774919614148, 'parts_of_same': 0.7925925925925926}, 'f1': {'supports': 0.8924424972617744, 'contradicts': 0.5369774919614148, 'parts_of_same': 0.7502191060473269}, 'support': {'supports': 2313, 'contradicts': 311, 'parts_of_same': 540}, 'micro_avg': {'precision': 0.831858407079646, 'recall': 0.831858407079646, 'f1': 0.831858407079646, 'support': None}, 'macro_avg': {'precision': 0.7178844072909274, 'recall': 0.7367481777739471, 'f1': 0.7265463650901719, 'support': None}, 'weighted_avg': {'precision': 0.8355674323526743, 'recall': 0.831858407079646, 'f1': 0.8332293974184705, 'support': None}}
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0846, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0890, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4911, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2787, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 15---------------
Evaluating
				 {'precision': {'supports': 0.8828678616090038, 'contradicts': 0.6743119266055045, 'parts_of_same': 0.7148080438756855}, 'recall': {'supports': 0.9156939040207522, 'contradicts': 0.47266881028938906, 'parts_of_same': 0.7240740740740741}, 'f1': {'supports': 0.898981324278438, 'contradicts': 0.555765595463138, 'parts_of_same': 0.7194112235510579}, 'support': {'supports': 2313, 'contradicts': 311, 'parts_of_same': 540}, 'micro_avg': {'precision': 0.8394437420986094, 'recall': 0.8394437420986094, 'f1': 0.8394437420986094, 'support': None}, 'macro_avg': {'precision': 0.757329277363398, 'recall': 0.7041455961280718, 'f1': 0.7247193810975446, 'support': None}, 'weighted_avg': {'precision': 0.8336854351355272, 'recall': 0.8394437420986094, 'f1': 0.8345982819098086, 'support': None}}
Loss: tensor(1.6237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7874, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0948, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9839, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0959, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0994, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0911, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1896, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0954, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3992, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0782, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0913, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0777, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0963, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2739, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3912, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0739, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9948, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1930, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 16---------------
Evaluating
				 {'precision': {'supports': 0.9232293214462606, 'contradicts': 0.4223744292237443, 'parts_of_same': 0.637906647807638}, 'recall': {'supports': 0.8058798097708604, 'contradicts': 0.594855305466238, 'parts_of_same': 0.8351851851851851}, 'f1': {'supports': 0.8605724838411819, 'contradicts': 0.4939919893190921, 'parts_of_same': 0.7233360064153969}, 'support': {'supports': 2313, 'contradicts': 311, 'parts_of_same': 540}, 'micro_avg': {'precision': 0.7901390644753477, 'recall': 0.7901390644753477, 'f1': 0.7901390644753477, 'support': None}, 'macro_avg': {'precision': 0.6611701328258809, 'recall': 0.7453067668074279, 'f1': 0.6926334931918903, 'support': None}, 'weighted_avg': {'precision': 0.8253026099272786, 'recall': 0.7901390644753477, 'f1': 0.8011179226508236, 'support': None}}
Loss: tensor(4.3514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0957, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0923, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1877, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0952, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0918, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1637, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0915, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2906, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0915, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0910, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1891, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0938, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0733, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(12.2728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4921, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4736, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1911, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2996, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2986, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0752, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2815, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0943, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0821, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3980, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8752, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0874, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0925, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0885, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0764, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1963, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1969, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1679, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6867, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 17---------------
Evaluating
				 {'precision': {'supports': 0.8970840480274442, 'contradicts': 0.5808580858085809, 'parts_of_same': 0.7561436672967864}, 'recall': {'supports': 0.9044530912235192, 'contradicts': 0.5659163987138264, 'parts_of_same': 0.7407407407407407}, 'f1': {'supports': 0.9007534983853607, 'contradicts': 0.5732899022801303, 'parts_of_same': 0.7483629560336763}, 'support': {'supports': 2313, 'contradicts': 311, 'parts_of_same': 540}, 'micro_avg': {'precision': 0.843236409608091, 'recall': 0.843236409608091, 'f1': 0.843236409608091, 'support': None}, 'macro_avg': {'precision': 0.7446952670442705, 'recall': 0.737036743559362, 'f1': 0.7408021188997225, 'support': None}, 'weighted_avg': {'precision': 0.8419468546505093, 'recall': 0.843236409608091, 'f1': 0.842557521375678, 'support': None}}
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0782, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9575, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1979, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0936, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0940, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 18---------------
Evaluating
				 {'precision': {'supports': 0.8794354838709677, 'contradicts': 0.6818181818181818, 'parts_of_same': 0.8103448275862069}, 'recall': {'supports': 0.9429312581063554, 'contradicts': 0.48231511254019294, 'parts_of_same': 0.6962962962962963}, 'f1': {'supports': 0.910077195910703, 'contradicts': 0.5649717514124294, 'parts_of_same': 0.749003984063745}, 'support': {'supports': 2313, 'contradicts': 311, 'parts_of_same': 540}, 'micro_avg': {'precision': 0.8555625790139064, 'recall': 0.8555625790139064, 'f1': 0.8555625790139064, 'support': None}, 'macro_avg': {'precision': 0.7905328310917854, 'recall': 0.7071808889809482, 'f1': 0.7413509771289591, 'support': None}, 'weighted_avg': {'precision': 0.8482193222615532, 'recall': 0.8555625790139064, 'f1': 0.8486652718789961, 'support': None}}
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3224e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3586e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0372e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3405e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 19---------------
Evaluating
				 {'precision': {'supports': 0.8892092257001647, 'contradicts': 0.6767241379310345, 'parts_of_same': 0.7916666666666666}, 'recall': {'supports': 0.9334198011240813, 'contradicts': 0.5048231511254019, 'parts_of_same': 0.7388888888888889}, 'f1': {'supports': 0.9107783168107993, 'contradicts': 0.578268876611418, 'parts_of_same': 0.764367816091954}, 'support': {'supports': 2313, 'contradicts': 311, 'parts_of_same': 540}, 'micro_avg': {'precision': 0.8580910240202275, 'recall': 0.8580910240202275, 'f1': 0.8580910240202275, 'support': None}, 'macro_avg': {'precision': 0.7858666767659552, 'recall': 0.7257106137127907, 'f1': 0.7511383365047237, 'support': None}, 'weighted_avg': {'precision': 0.8516757730534237, 'recall': 0.8580910240202275, 'f1': 0.8531069810680104, 'support': None}}
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8244e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3586e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3405e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4310e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 20---------------
Evaluating
				 {'precision': {'supports': 0.893050353724511, 'contradicts': 0.6767241379310345, 'parts_of_same': 0.7674858223062382}, 'recall': {'supports': 0.9277993947254648, 'contradicts': 0.5048231511254019, 'parts_of_same': 0.7518518518518519}, 'f1': {'supports': 0.9100932994062766, 'contradicts': 0.578268876611418, 'parts_of_same': 0.7595884003741815}, 'support': {'supports': 2313, 'contradicts': 311, 'parts_of_same': 540}, 'micro_avg': {'precision': 0.8561946902654868, 'recall': 0.8561946902654868, 'f1': 0.8561946902654868, 'support': None}, 'macro_avg': {'precision': 0.7790867713205945, 'recall': 0.7281581325675729, 'f1': 0.7493168587972919, 'support': None}, 'weighted_avg': {'precision': 0.8503568328403016, 'recall': 0.8561946902654868, 'f1': 0.8517905051690665, 'support': None}}
Loss: tensor(1.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4491e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7024e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8425e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7682e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 21---------------
Evaluating
				 {'precision': {'supports': 0.8934221482098251, 'contradicts': 0.6738197424892703, 'parts_of_same': 0.7674858223062382}, 'recall': {'supports': 0.9277993947254648, 'contradicts': 0.5048231511254019, 'parts_of_same': 0.7518518518518519}, 'f1': {'supports': 0.9102863202545068, 'contradicts': 0.5772058823529411, 'parts_of_same': 0.7595884003741815}, 'support': {'supports': 2313, 'contradicts': 311, 'parts_of_same': 540}, 'micro_avg': {'precision': 0.8561946902654868, 'recall': 0.8561946902654868, 'f1': 0.8561946902654868, 'support': None}, 'macro_avg': {'precision': 0.778242571001778, 'recall': 0.7281581325675729, 'f1': 0.7490268676605432, 'support': None}, 'weighted_avg': {'precision': 0.8503431456285896, 'recall': 0.8561946902654868, 'f1': 0.8518271252725971, 'support': None}}
Loss: tensor(2.9540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4129e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4310e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8244e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5567e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 22---------------
Evaluating
				 {'precision': {'supports': 0.893377759266972, 'contradicts': 0.6709401709401709, 'parts_of_same': 0.7674858223062382}, 'recall': {'supports': 0.9273670557717251, 'contradicts': 0.5048231511254019, 'parts_of_same': 0.7518518518518519}, 'f1': {'supports': 0.9100551548578701, 'contradicts': 0.5761467889908256, 'parts_of_same': 0.7595884003741815}, 'support': {'supports': 2313, 'contradicts': 311, 'parts_of_same': 540}, 'micro_avg': {'precision': 0.8558786346396966, 'recall': 0.8558786346396966, 'f1': 0.8558786346396965, 'support': None}, 'macro_avg': {'precision': 0.7772679175044604, 'recall': 0.7280140195829929, 'f1': 0.7485967814076258, 'support': None}, 'weighted_avg': {'precision': 0.8500276530949014, 'recall': 0.8558786346396966, 'f1': 0.8515540331113965, 'support': None}}
Loss: tensor(5.1674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5801e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4491e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4172e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3586e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8425e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7205e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0372e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7024e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 23---------------
Evaluating
				 {'precision': {'supports': 0.893377759266972, 'contradicts': 0.6709401709401709, 'parts_of_same': 0.7674858223062382}, 'recall': {'supports': 0.9273670557717251, 'contradicts': 0.5048231511254019, 'parts_of_same': 0.7518518518518519}, 'f1': {'supports': 0.9100551548578701, 'contradicts': 0.5761467889908256, 'parts_of_same': 0.7595884003741815}, 'support': {'supports': 2313, 'contradicts': 311, 'parts_of_same': 540}, 'micro_avg': {'precision': 0.8558786346396966, 'recall': 0.8558786346396966, 'f1': 0.8558786346396965, 'support': None}, 'macro_avg': {'precision': 0.7772679175044604, 'recall': 0.7280140195829929, 'f1': 0.7485967814076258, 'support': None}, 'weighted_avg': {'precision': 0.8500276530949014, 'recall': 0.8558786346396966, 'f1': 0.8515540331113965, 'support': None}}
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7205e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4353e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7205e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7024e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4534e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4353e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1050e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 24---------------
Evaluating
				 {'precision': {'supports': 0.8933333333333333, 'contradicts': 0.6680851063829787, 'parts_of_same': 0.7674858223062382}, 'recall': {'supports': 0.9269347168179853, 'contradicts': 0.5048231511254019, 'parts_of_same': 0.7518518518518519}, 'f1': {'supports': 0.9098238913643115, 'contradicts': 0.5750915750915752, 'parts_of_same': 0.7595884003741815}, 'support': {'supports': 2313, 'contradicts': 311, 'parts_of_same': 540}, 'micro_avg': {'precision': 0.8555625790139064, 'recall': 0.8555625790139064, 'f1': 0.8555625790139064, 'support': None}, 'macro_avg': {'precision': 0.7763014206741833, 'recall': 0.727869906598413, 'f1': 0.7481679556100227, 'support': None}, 'weighted_avg': {'precision': 0.8497145423926911, 'recall': 0.8555625790139064, 'f1': 0.8512812505629551, 'support': None}}
Loss: tensor(9.4309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4715e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9558e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4534e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6706e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5077e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5258e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5982e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3224e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9554e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7973e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1600e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 25---------------
Evaluating
				 {'precision': {'supports': 0.893705710712797, 'contradicts': 0.6680851063829787, 'parts_of_same': 0.7679245283018868}, 'recall': {'supports': 0.9269347168179853, 'contradicts': 0.5048231511254019, 'parts_of_same': 0.7537037037037037}, 'f1': {'supports': 0.9100169779286927, 'contradicts': 0.5750915750915752, 'parts_of_same': 0.7607476635514018}, 'support': {'supports': 2313, 'contradicts': 311, 'parts_of_same': 540}, 'micro_avg': {'precision': 0.8558786346396966, 'recall': 0.8558786346396966, 'f1': 0.8558786346396965, 'support': None}, 'macro_avg': {'precision': 0.7765717817992209, 'recall': 0.7284871905490302, 'f1': 0.7486187388572233, 'support': None}, 'weighted_avg': {'precision': 0.8500616378782632, 'recall': 0.8558786346396966, 'f1': 0.8516202554109681, 'support': None}}
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4896e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3767e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8478e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4129e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4715e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5258e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8604e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9920e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3876e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9015e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4414e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8514e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2257e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6706e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3512e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4534e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 26---------------
Evaluating
				 {'precision': {'supports': 0.8936613844870726, 'contradicts': 0.6652542372881356, 'parts_of_same': 0.7679245283018868}, 'recall': {'supports': 0.9265023778642456, 'contradicts': 0.5048231511254019, 'parts_of_same': 0.7537037037037037}, 'f1': {'supports': 0.9097856081511357, 'contradicts': 0.5740402193784279, 'parts_of_same': 0.7607476635514018}, 'support': {'supports': 2313, 'contradicts': 311, 'parts_of_same': 540}, 'micro_avg': {'precision': 0.8555625790139064, 'recall': 0.8555625790139064, 'f1': 0.8555625790139064, 'support': None}, 'macro_avg': {'precision': 0.7756133833590316, 'recall': 0.7283430775644503, 'f1': 0.748191163693655, 'support': None}, 'weighted_avg': {'precision': 0.849750978318024, 'recall': 0.8555625790139064, 'f1': 0.8513477743988701, 'support': None}}
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5887e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9664e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9313e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8735e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2949e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6851e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0909e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2516e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1320e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7249e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9015e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6108e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9452e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5258e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5955e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2044e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3533e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2876e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3399e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 27---------------
Evaluating
				 {'precision': {'supports': 0.8936613844870726, 'contradicts': 0.6652542372881356, 'parts_of_same': 0.7679245283018868}, 'recall': {'supports': 0.9265023778642456, 'contradicts': 0.5048231511254019, 'parts_of_same': 0.7537037037037037}, 'f1': {'supports': 0.9097856081511357, 'contradicts': 0.5740402193784279, 'parts_of_same': 0.7607476635514018}, 'support': {'supports': 2313, 'contradicts': 311, 'parts_of_same': 540}, 'micro_avg': {'precision': 0.8555625790139064, 'recall': 0.8555625790139064, 'f1': 0.8555625790139064, 'support': None}, 'macro_avg': {'precision': 0.7756133833590316, 'recall': 0.7283430775644503, 'f1': 0.748191163693655, 'support': None}, 'weighted_avg': {'precision': 0.849750978318024, 'recall': 0.8555625790139064, 'f1': 0.8513477743988701, 'support': None}}
Loss: tensor(2.6423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7403e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6681e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7792e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6891e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3441e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7737e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6887e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3319e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2922e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3130e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6500e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5355e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0920e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7213e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4534e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1863e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5439e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3593e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8447e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2105e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9558e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8249e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9518e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1593e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2949e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6770e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7858e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4622e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4211e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0357e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7856e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5077e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3714e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5266e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 28---------------
Evaluating
				 {'precision': {'supports': 0.8940783986655546, 'contradicts': 0.6652542372881356, 'parts_of_same': 0.7679245283018868}, 'recall': {'supports': 0.9269347168179853, 'contradicts': 0.5048231511254019, 'parts_of_same': 0.7537037037037037}, 'f1': {'supports': 0.9102101464657186, 'contradicts': 0.5740402193784279, 'parts_of_same': 0.7607476635514018}, 'support': {'supports': 2313, 'contradicts': 311, 'parts_of_same': 540}, 'micro_avg': {'precision': 0.8558786346396966, 'recall': 0.8558786346396966, 'f1': 0.8558786346396965, 'support': None}, 'macro_avg': {'precision': 0.7757523880851923, 'recall': 0.7284871905490302, 'f1': 0.7483326764651826, 'support': None}, 'weighted_avg': {'precision': 0.850055830971257, 'recall': 0.8558786346396966, 'f1': 0.851658127471446, 'support': None}}
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5077e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7355e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5258e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2406e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2869e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7024e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5169e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8975e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9163e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4216e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6313e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2951e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0304e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2768e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9693e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5774e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2461e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5483e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4586e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1262e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4361e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7743e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1156e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9536e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3203e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6024e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5094e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2161e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1320e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1028e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6255e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5646e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6342e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6077e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4856e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7708e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1278e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8302e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7205e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8701e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5712e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9251e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5949e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4882e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1622e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1200e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0909e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8807e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5792e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1039e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2467e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4792e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5955e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6189e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7792e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1103e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5995e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5887e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2642e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4099e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8907e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8478e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0538e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6227e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8152e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8642e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9655e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 29---------------
Evaluating
				 {'precision': {'supports': 0.8940783986655546, 'contradicts': 0.6652542372881356, 'parts_of_same': 0.7679245283018868}, 'recall': {'supports': 0.9269347168179853, 'contradicts': 0.5048231511254019, 'parts_of_same': 0.7537037037037037}, 'f1': {'supports': 0.9102101464657186, 'contradicts': 0.5740402193784279, 'parts_of_same': 0.7607476635514018}, 'support': {'supports': 2313, 'contradicts': 311, 'parts_of_same': 540}, 'micro_avg': {'precision': 0.8558786346396966, 'recall': 0.8558786346396966, 'f1': 0.8558786346396965, 'support': None}, 'macro_avg': {'precision': 0.7757523880851923, 'recall': 0.7284871905490302, 'f1': 0.7483326764651826, 'support': None}, 'weighted_avg': {'precision': 0.850055830971257, 'recall': 0.8558786346396966, 'f1': 0.851658127471446, 'support': None}}
Loss: tensor(2.2823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8761e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5695e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1531e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9624e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8951e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9534e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2425e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4026e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9527e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7602e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7379e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8322e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5999e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1050e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5637e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5375e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3624e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7977e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9059e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2406e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5436e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7642e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9032e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5893e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0507e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6882e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0706e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4357e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1593e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8432e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6931e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6940e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8379e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3681e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2161e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5271e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3191e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0055e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8648e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9554e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1101e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4545e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8008e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1496e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4379e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7101e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9916e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4176e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9043e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7871e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1637e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8951e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8405e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1381e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3410e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5655e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3284e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2754e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5792e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3125e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5022e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2308e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7372e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6108e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1990e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6816e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3895e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4719e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2763e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1176e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2044e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0973e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4180e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3147e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9580e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0598e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3190e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 30---------------
Evaluating
				 {'precision': {'supports': 0.893705710712797, 'contradicts': 0.6652542372881356, 'parts_of_same': 0.7674858223062382}, 'recall': {'supports': 0.9269347168179853, 'contradicts': 0.5048231511254019, 'parts_of_same': 0.7518518518518519}, 'f1': {'supports': 0.9100169779286927, 'contradicts': 0.5740402193784279, 'parts_of_same': 0.7595884003741815}, 'support': {'supports': 2313, 'contradicts': 311, 'parts_of_same': 540}, 'micro_avg': {'precision': 0.8555625790139064, 'recall': 0.8555625790139064, 'f1': 0.8555625790139064, 'support': None}, 'macro_avg': {'precision': 0.7754819234357235, 'recall': 0.727869906598413, 'f1': 0.7478818658937674, 'support': None}, 'weighted_avg': {'precision': 0.8497085084452206, 'recall': 0.8555625790139064, 'f1': 0.8513190626984245, 'support': None}}
Loss: tensor(3.6998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8379e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3406e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5408e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5257e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5684e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8642e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0604e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2410e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9441e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2127e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5558e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8112e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2514e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3668e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6308e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5765e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7331e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6143e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9050e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6308e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7112e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7847e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0754e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0077e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8653e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8114e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3767e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7123e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5271e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6414e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6485e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5284e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6255e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7088e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6525e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5591e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0988e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9783e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8622e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1324e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1352e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8043e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5990e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1203e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5443e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5262e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2697e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7421e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9472e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4271e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5238e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3311e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9920e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1229e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8439e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8339e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6489e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5397e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4750e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6898e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2225e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9999e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0249e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4452e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5772e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2569e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4633e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5353e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5990e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9390e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3191e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7849e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5022e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1043e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3112e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0586e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0953e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2783e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3419e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3384e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6990e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6735e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0129e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0324e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3858e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9735e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4271e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7266e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3399e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8467e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8432e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3125e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1699e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7681e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3134e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8507e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3238e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3849e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7821e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9238e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)


		-------------RUN 4-----------
			------------EPOCH 1---------------
Evaluating
				 {'precision': {'supports': 0.47619047619047616, 'contradicts': 0.09387605427209388, 'parts_of_same': 0.0}, 'recall': {'supports': 0.004859086491739553, 'contradicts': 0.9884169884169884, 'parts_of_same': 0.0}, 'f1': {'supports': 0.009620009620009619, 'contradicts': 0.17146684527796383, 'parts_of_same': 0.0}, 'support': {'supports': 2058, 'contradicts': 259, 'parts_of_same': 431}, 'micro_avg': {'precision': 0.09679767103347889, 'recall': 0.09679767103347889, 'f1': 0.09679767103347889, 'support': None}, 'macro_avg': {'precision': 0.19002217682085668, 'recall': 0.331092024969576, 'f1': 0.06036228496599114, 'support': None}, 'weighted_avg': {'precision': 0.36547085082113256, 'recall': 0.09679767103347889, 'f1': 0.023365317585506706, 'support': None}}
Loss: tensor(1.2414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8979, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3846, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3877, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3956, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4862, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4849, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3965, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0949, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3908, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3801, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8990, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2962, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2886, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6993, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2976, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2903, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2885, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7914, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2904, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7941, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2638, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6924, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2967, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3942, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6961, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4733, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3998, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3638, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3782, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3928, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2849, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3931, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0885, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1848, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3819, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8937, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9954, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1920, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2777, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2800, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6963, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1853, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2927, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1981, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1767, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1862, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9979, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1796, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8930, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2988, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0830, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7849, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5945, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1679, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1879, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2944, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0693, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1957, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2878, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2867, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2900, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3787, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1840, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5985, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4997, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3805, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9818, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2955, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3830, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1938, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2982, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1961, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1990, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4830, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4990, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2866, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1972, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1679, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6920, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3911, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0638, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3982, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2988, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7782, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3897, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4853, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5990, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2833, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0987, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1976, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2824, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1879, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1946, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5752, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6794, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2820, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2992, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2806, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2952, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3912, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1817, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1817, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9962, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3819, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5982, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2846, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3801, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2817, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0879, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0918, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7752, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6991, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1992, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6934, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2911, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2992, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1693, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1820, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1986, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2862, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2849, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1982, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3693, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4911, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0888, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1947, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6982, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2933, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0962, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2979, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1801, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2933, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1916, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1951, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3751, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2873, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2928, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0989, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8939, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0915, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9742, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2968, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7955, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1891, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2920, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1927, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1752, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5789, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9890, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2919, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0993, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7980, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4941, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9992, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1973, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2000, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1919, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3946, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3000, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5690, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0989, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8815, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1839, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0926, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0949, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0925, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1787, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0947, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0956, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1853, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3956, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4875, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0931, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1969, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3912, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2998, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0638, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1751, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1852, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1948, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2967, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1988, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3949, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4885, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7955, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2996, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1957, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9679, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9981, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0764, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1935, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1924, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1927, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0835, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4997, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0800, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1958, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2817, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2898, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2883, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1997, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3800, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1857, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1874, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2787, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2805, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0996, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1758, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0954, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4994, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0985, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5912, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3862, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3967, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0716, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2910, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2820, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0952, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2960, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2900, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3885, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2910, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2747, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2972, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2946, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5956, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3918, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2690, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0741, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0767, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1913, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3957, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0987, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3800, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0764, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2837, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5990, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3736, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3720, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1913, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1963, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3834, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5924, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4915, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 2---------------
Evaluating
				 {'precision': {'supports': 0.9793459552495697, 'contradicts': 0.5631067961165048, 'parts_of_same': 0.2805124747134187}, 'recall': {'supports': 0.5529640427599611, 'contradicts': 0.22393822393822393, 'parts_of_same': 0.9651972157772621}, 'f1': {'supports': 0.706832298136646, 'contradicts': 0.32044198895027626, 'parts_of_same': 0.4346917450365726}, 'support': {'supports': 2058, 'contradicts': 259, 'parts_of_same': 431}, 'micro_avg': {'precision': 0.586608442503639, 'recall': 0.586608442503639, 'f1': 0.586608442503639, 'support': None}, 'macro_avg': {'precision': 0.6076550753598311, 'recall': 0.5806998274918157, 'f1': 0.4873220107078316, 'support': None}, 'weighted_avg': {'precision': 0.8305092840972609, 'recall': 0.586608442503639, 'f1': 0.6277319821012015, 'support': None}}
Loss: tensor(0.3164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8938, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1993, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2857, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0879, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1968, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6928, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3772, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0849, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1808, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9824, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5787, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4953, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1739, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2821, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9934, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0888, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0965, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0925, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1739, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3848, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2839, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0863, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4720, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5934, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8742, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4777, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0921, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0989, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0911, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5676, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0687, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0996, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3693, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0914, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2733, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1878, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1877, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2817, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1925, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2963, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0820, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3866, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1771, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0946, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0961, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2991, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0896, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1939, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5989, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6862, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1888, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0888, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2833, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2818, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4679, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0839, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0953, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2764, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3919, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0962, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8990, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0875, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2877, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0999, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4935, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4857, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8767, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0806, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2898, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0742, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0998, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0772, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0949, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0889, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0944, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0927, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0973, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0912, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1927, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2957, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2973, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0992, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0997, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2817, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1957, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1837, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0952, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0853, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0742, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7914, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4908, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1976, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1994, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4976, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0954, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0937, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0764, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0879, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1913, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0943, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1904, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0853, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1848, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0940, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3948, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0857, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0960, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1782, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3949, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0918, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1793, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6787, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2949, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0913, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0849, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1840, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8957, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1863, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3837, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4638, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0942, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0997, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3990, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0910, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1971, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0959, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2915, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0972, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0979, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0752, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5965, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3794, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0793, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0961, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1817, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0716, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2693, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9833, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0784, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2943, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1881, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2928, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1931, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0800, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0998, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5852, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0936, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0914, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4881, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0736, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0737, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2934, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3835, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0965, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0817, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0942, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0852, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2862, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0764, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0830, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1960, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0758, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1917, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6917, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0982, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3973, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2933, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3995, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1720, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0944, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8926, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0739, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2803, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9972, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8904, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5742, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1961, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0990, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1578, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 3---------------
Evaluating
				 {'precision': {'supports': 0.9601046435578809, 'contradicts': 0.3190271816881259, 'parts_of_same': 0.6307692307692307}, 'recall': {'supports': 0.7133138969873664, 'contradicts': 0.861003861003861, 'parts_of_same': 0.7610208816705336}, 'f1': {'supports': 0.8185112907722331, 'contradicts': 0.4655532359081419, 'parts_of_same': 0.6898002103049421}, 'support': {'supports': 2058, 'contradicts': 259, 'parts_of_same': 431}, 'micro_avg': {'precision': 0.7347161572052402, 'recall': 0.7347161572052402, 'f1': 0.7347161572052403, 'support': None}, 'macro_avg': {'precision': 0.6366336853384126, 'recall': 0.778446213220587, 'f1': 0.6579549123284391, 'support': None}, 'weighted_avg': {'precision': 0.8480294523147314, 'recall': 0.7347161572052402, 'f1': 0.7650576474348233, 'support': None}}
Loss: tensor(0.1521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1762, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2808, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2789, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7986, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0975, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0860, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8771, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2817, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0733, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4687, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3949, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0739, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0819, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0889, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0957, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0752, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0758, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0824, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4917, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2879, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0954, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2849, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0824, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2793, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0867, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2000, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1937, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1638, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0705, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6687, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0960, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0947, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0898, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0839, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0943, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0909, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0994, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2971, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2985, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2860, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1911, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0947, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0782, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2824, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0982, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1751, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0910, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7747, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0939, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0946, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0998, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0741, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2888, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0751, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4968, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2933, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6906, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0796, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4887, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1913, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0803, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7935, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0794, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7892, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0742, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0933, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0878, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2949, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1990, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2767, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0979, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0716, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0925, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0794, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0982, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0942, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2917, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0938, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0687, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1771, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1852, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1955, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0948, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0793, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0960, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4951, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2886, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7719, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 4---------------
Evaluating
				 {'precision': {'supports': 0.9246332827516439, 'contradicts': 0.6212121212121212, 'parts_of_same': 0.6824457593688363}, 'recall': {'supports': 0.8882410106899903, 'contradicts': 0.6332046332046332, 'parts_of_same': 0.802784222737819}, 'f1': {'supports': 0.9060718711276332, 'contradicts': 0.627151051625239, 'parts_of_same': 0.7377398720682302}, 'support': {'supports': 2058, 'contradicts': 259, 'parts_of_same': 431}, 'micro_avg': {'precision': 0.8508005822416302, 'recall': 0.8508005822416302, 'f1': 0.8508005822416302, 'support': None}, 'macro_avg': {'precision': 0.7427637211108671, 'recall': 0.7747432888774807, 'f1': 0.7569875982737008, 'support': None}, 'weighted_avg': {'precision': 0.8580507123671001, 'recall': 0.8508005822416302, 'f1': 0.8533820662347211, 'support': None}}
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2996, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0818, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0676, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1938, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2968, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0916, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0787, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0941, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3777, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1904, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0866, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5926, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4939, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0690, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0906, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0881, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3747, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0736, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4819, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1985, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1794, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5878, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0818, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0980, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0764, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1874, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0890, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0888, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0968, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6866, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0818, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3737, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3916, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0937, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0837, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0886, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1877, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0898, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1849, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0875, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2924, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3820, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 5---------------
Evaluating
				 {'precision': {'supports': 0.921025641025641, 'contradicts': 0.5339233038348082, 'parts_of_same': 0.7080610021786492}, 'recall': {'supports': 0.8726919339164237, 'contradicts': 0.6988416988416989, 'parts_of_same': 0.7540603248259861}, 'f1': {'supports': 0.8962075848303394, 'contradicts': 0.6053511705685619, 'parts_of_same': 0.7303370786516854}, 'support': {'supports': 2058, 'contradicts': 259, 'parts_of_same': 431}, 'micro_avg': {'precision': 0.8377001455604076, 'recall': 0.8377001455604076, 'f1': 0.8377001455604075, 'support': None}, 'macro_avg': {'precision': 0.7210033156796994, 'recall': 0.7751979858613695, 'f1': 0.7439652780168622, 'support': None}, 'weighted_avg': {'precision': 0.8511394457288872, 'recall': 0.8377001455604076, 'f1': 0.8427789096277193, 'support': None}}
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2976, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2883, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4720, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0857, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4733, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0857, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0963, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3824, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6000, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3730, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0848, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0982, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8989, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0957, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0815, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0941, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5638, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0789, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0806, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 6---------------
Evaluating
				 {'precision': {'supports': 0.9039111540318686, 'contradicts': 0.5233333333333333, 'parts_of_same': 0.8116710875331565}, 'recall': {'supports': 0.9096209912536443, 'contradicts': 0.6061776061776062, 'parts_of_same': 0.7099767981438515}, 'f1': {'supports': 0.906757084039719, 'contradicts': 0.5617173524150267, 'parts_of_same': 0.7574257425742575}, 'support': {'supports': 2058, 'contradicts': 259, 'parts_of_same': 431}, 'micro_avg': {'precision': 0.8497088791848617, 'recall': 0.8497088791848617, 'f1': 0.8497088791848617, 'support': None}, 'macro_avg': {'precision': 0.7463051916327862, 'recall': 0.7419251318583674, 'f1': 0.7419667263430011, 'support': None}, 'weighted_avg': {'precision': 0.8535745003849016, 'recall': 0.8497088791848617, 'f1': 0.8508156362004142, 'support': None}}
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6000, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3835, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3994, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3818, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1720, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2993, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5982, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0758, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0911, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0910, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0808, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4874, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1995, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5919, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0777, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1912, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5904, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0908, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0720, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0881, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5911, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0846, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0952, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1771, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4863, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0866, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 7---------------
Evaluating
				 {'precision': {'supports': 0.8999028182701652, 'contradicts': 0.5218855218855218, 'parts_of_same': 0.7608142493638677}, 'recall': {'supports': 0.8999028182701652, 'contradicts': 0.5984555984555985, 'parts_of_same': 0.6937354988399071}, 'f1': {'supports': 0.8999028182701652, 'contradicts': 0.5575539568345322, 'parts_of_same': 0.7257281553398057}, 'support': {'supports': 2058, 'contradicts': 259, 'parts_of_same': 431}, 'micro_avg': {'precision': 0.839155749636099, 'recall': 0.839155749636099, 'f1': 0.839155749636099, 'support': None}, 'macro_avg': {'precision': 0.7275341965065182, 'recall': 0.7306979718552237, 'f1': 0.7277283101481676, 'support': None}, 'weighted_avg': {'precision': 0.8424597131165127, 'recall': 0.839155749636099, 'f1': 0.8403185261177584, 'support': None}}
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4767, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0676, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0853, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0637, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0794, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2679, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1914, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0897, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0947, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0995, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0934, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0919, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0906, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4801, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0877, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0874, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0904, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3913, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1879, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3954, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 8---------------
Evaluating
				 {'precision': {'supports': 0.9333691563675444, 'contradicts': 0.5060240963855421, 'parts_of_same': 0.6360360360360361}, 'recall': {'supports': 0.8440233236151603, 'contradicts': 0.6486486486486487, 'parts_of_same': 0.8190255220417634}, 'f1': {'supports': 0.8864506251594795, 'contradicts': 0.5685279187817258, 'parts_of_same': 0.716024340770791}, 'support': {'supports': 2058, 'contradicts': 259, 'parts_of_same': 431}, 'micro_avg': {'precision': 0.8216885007278021, 'recall': 0.8216885007278021, 'f1': 0.821688500727802, 'support': None}, 'macro_avg': {'precision': 0.6918097629297075, 'recall': 0.7705658314351909, 'f1': 0.7236676282373321, 'support': None}, 'weighted_avg': {'precision': 0.8464576041847864, 'recall': 0.8216885007278021, 'f1': 0.8297564077201189, 'support': None}}
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0736, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0870, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0887, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0961, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5803, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0937, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2956, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0923, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 9---------------
Evaluating
				 {'precision': {'supports': 0.908084696823869, 'contradicts': 0.6425531914893617, 'parts_of_same': 0.7425287356321839}, 'recall': {'supports': 0.9169096209912536, 'contradicts': 0.583011583011583, 'parts_of_same': 0.7494199535962877}, 'f1': {'supports': 0.9124758220502901, 'contradicts': 0.6113360323886641, 'parts_of_same': 0.745958429561201}, 'support': {'supports': 2058, 'contradicts': 259, 'parts_of_same': 431}, 'micro_avg': {'precision': 0.8591703056768559, 'recall': 0.8591703056768559, 'f1': 0.8591703056768558, 'support': None}, 'macro_avg': {'precision': 0.7643888746484716, 'recall': 0.7497803858663747, 'f1': 0.7565900946667184, 'support': None}, 'weighted_avg': {'precision': 0.8570922371603853, 'recall': 0.8591703056768559, 'f1': 0.8579764764588932, 'support': None}}
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5440e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 10---------------
Evaluating
				 {'precision': {'supports': 0.9093525179856116, 'contradicts': 0.6502057613168725, 'parts_of_same': 0.7666666666666667}, 'recall': {'supports': 0.9212827988338192, 'contradicts': 0.61003861003861, 'parts_of_same': 0.7470997679814385}, 'f1': {'supports': 0.9152787834902246, 'contradicts': 0.6294820717131475, 'parts_of_same': 0.7567567567567568}, 'support': {'supports': 2058, 'contradicts': 259, 'parts_of_same': 431}, 'micro_avg': {'precision': 0.8646288209606987, 'recall': 0.8646288209606987, 'f1': 0.8646288209606987, 'support': None}, 'macro_avg': {'precision': 0.7754083153230503, 'recall': 0.7594737256179559, 'f1': 0.7671725373200431, 'support': None}, 'weighted_avg': {'precision': 0.8625488018663726, 'recall': 0.8646288209606987, 'f1': 0.8634795324449598, 'support': None}}
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8472e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 11---------------
Evaluating
				 {'precision': {'supports': 0.925777331995988, 'contradicts': 0.6326530612244898, 'parts_of_same': 0.68762278978389}, 'recall': {'supports': 0.8969873663751214, 'contradicts': 0.5984555984555985, 'parts_of_same': 0.8120649651972158}, 'f1': {'supports': 0.9111549851924976, 'contradicts': 0.6150793650793652, 'parts_of_same': 0.7446808510638298}, 'support': {'supports': 2058, 'contradicts': 259, 'parts_of_same': 431}, 'micro_avg': {'precision': 0.8555312954876274, 'recall': 0.8555312954876274, 'f1': 0.8555312954876274, 'support': None}, 'macro_avg': {'precision': 0.7486843943347893, 'recall': 0.7691693100093119, 'f1': 0.7569717337785642, 'support': None}, 'weighted_avg': {'precision': 0.8607977854809834, 'recall': 0.8555312954876274, 'f1': 0.8571397241230808, 'support': None}}
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4534e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7024e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4310e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9015e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5801e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7973e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3794e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 12---------------
Evaluating
				 {'precision': {'supports': 0.9178957718780728, 'contradicts': 0.6363636363636364, 'parts_of_same': 0.7139830508474576}, 'recall': {'supports': 0.9071914480077745, 'contradicts': 0.5945945945945946, 'parts_of_same': 0.7819025522041764}, 'f1': {'supports': 0.912512218963832, 'contradicts': 0.6147704590818364, 'parts_of_same': 0.7464008859357697}, 'support': {'supports': 2058, 'contradicts': 259, 'parts_of_same': 431}, 'micro_avg': {'precision': 0.8580786026200873, 'recall': 0.8580786026200873, 'f1': 0.8580786026200873, 'support': None}, 'macro_avg': {'precision': 0.7560808196963889, 'recall': 0.7612295316021819, 'f1': 0.7578945213271461, 'support': None}, 'weighted_avg': {'precision': 0.8593793214186719, 'recall': 0.8580786026200873, 'f1': 0.8583968258253561, 'support': None}}
Loss: tensor(5.6414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2869e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2225e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5258e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3673e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1863e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9015e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2136e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3796e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3492e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9022e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 13---------------
Evaluating
				 {'precision': {'supports': 0.9178957718780728, 'contradicts': 0.6378600823045267, 'parts_of_same': 0.7154989384288747}, 'recall': {'supports': 0.9071914480077745, 'contradicts': 0.5984555984555985, 'parts_of_same': 0.7819025522041764}, 'f1': {'supports': 0.912512218963832, 'contradicts': 0.6175298804780877, 'parts_of_same': 0.7472283813747228}, 'support': {'supports': 2058, 'contradicts': 259, 'parts_of_same': 431}, 'micro_avg': {'precision': 0.8584425036390102, 'recall': 0.8584425036390102, 'f1': 0.8584425036390102, 'support': None}, 'macro_avg': {'precision': 0.7570849308704913, 'recall': 0.7625165328891831, 'f1': 0.7590901602722141, 'support': None}, 'weighted_avg': {'precision': 0.8597581158314378, 'recall': 0.8584425036390102, 'f1': 0.8587866877888998, 'support': None}}
Loss: tensor(9.5343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4520e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5258e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0688e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7249e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7973e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4452e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9496e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3130e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4172e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4353e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7205e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0255e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0278e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2498e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4896e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9558e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 14---------------
Evaluating
				 {'precision': {'supports': 0.9174447174447175, 'contradicts': 0.6378600823045267, 'parts_of_same': 0.7148936170212766}, 'recall': {'supports': 0.9071914480077745, 'contradicts': 0.5984555984555985, 'parts_of_same': 0.7795823665893271}, 'f1': {'supports': 0.912289274370877, 'contradicts': 0.6175298804780877, 'parts_of_same': 0.7458379578246394}, 'support': {'supports': 2058, 'contradicts': 259, 'parts_of_same': 431}, 'micro_avg': {'precision': 0.8580786026200873, 'recall': 0.8580786026200873, 'f1': 0.8580786026200873, 'support': None}, 'macro_avg': {'precision': 0.7567328055901736, 'recall': 0.7617431376842333, 'f1': 0.7585523708912013, 'support': None}, 'weighted_avg': {'precision': 0.8593253780037376, 'recall': 0.8580786026200873, 'f1': 0.8584016468418884, 'support': None}}
Loss: tensor(3.3780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4715e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9602e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5032e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1863e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5260e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4077e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8653e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9558e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9920e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8653e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8472e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6525e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4715e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3743e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4534e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8697e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5982e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2635e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7957e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1955e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7213e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4940e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2801e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7447e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1885e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 15---------------
Evaluating
				 {'precision': {'supports': 0.9174852652259332, 'contradicts': 0.6363636363636364, 'parts_of_same': 0.7170212765957447}, 'recall': {'supports': 0.9076773566569485, 'contradicts': 0.5945945945945946, 'parts_of_same': 0.7819025522041764}, 'f1': {'supports': 0.9125549584758181, 'contradicts': 0.6147704590818364, 'parts_of_same': 0.7480577136514983}, 'support': {'supports': 2058, 'contradicts': 259, 'parts_of_same': 431}, 'micro_avg': {'precision': 0.8584425036390102, 'recall': 0.8584425036390102, 'f1': 0.8584425036390102, 'support': None}, 'macro_avg': {'precision': 0.7569567260617713, 'recall': 0.7613915011519065, 'f1': 0.7584610437363842, 'support': None}, 'weighted_avg': {'precision': 0.8595484089759529, 'recall': 0.8584425036390102, 'f1': 0.8586886928781751, 'support': None}}
Loss: tensor(3.6509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3673e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4339e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1320e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7792e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1622e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7019e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5322e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7602e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5483e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8845e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2044e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1973e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6163e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4310e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7205e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9015e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8244e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1863e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1774e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4896e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8116e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6887e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3781e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6887e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4145e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3185e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4913e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7198e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8783e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2355e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3130e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3962e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9384e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 16---------------
Evaluating
				 {'precision': {'supports': 0.9170755642787046, 'contradicts': 0.6352459016393442, 'parts_of_same': 0.7167381974248928}, 'recall': {'supports': 0.9081632653061225, 'contradicts': 0.5984555984555985, 'parts_of_same': 0.7749419953596288}, 'f1': {'supports': 0.9125976562499999, 'contradicts': 0.6163021868787277, 'parts_of_same': 0.7447045707915274}, 'support': {'supports': 2058, 'contradicts': 259, 'parts_of_same': 431}, 'micro_avg': {'precision': 0.8580786026200873, 'recall': 0.8580786026200873, 'f1': 0.8580786026200873, 'support': None}, 'macro_avg': {'precision': 0.7563532211143139, 'recall': 0.7605202863737833, 'f1': 0.7578681379734183, 'support': None}, 'weighted_avg': {'precision': 0.8590918351165548, 'recall': 0.8580786026200873, 'f1': 0.8583391240812367, 'support': None}}
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7249e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4896e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0821e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6227e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2845e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9602e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7068e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3767e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4534e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2695e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4030e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5257e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0108e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5949e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2741e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4017e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0640e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4439e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3225e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4264e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5041e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4715e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8472e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5920e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5258e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9708e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4759e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6026e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2536e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3405e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3854e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1653e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3587e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0315e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4688e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4353e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4701e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1260e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5262e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1984e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9735e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8538e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5026e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1010e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3044e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1260e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6163e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5013e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2741e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3909e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8878e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4039e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4779e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0174e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8516e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3050e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5845e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1057e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6803e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6887e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9059e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4534e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3130e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2648e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3940e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1320e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9015e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 17---------------
Evaluating
				 {'precision': {'supports': 0.917156862745098, 'contradicts': 0.6352459016393442, 'parts_of_same': 0.7198275862068966}, 'recall': {'supports': 0.9091350826044704, 'contradicts': 0.5984555984555985, 'parts_of_same': 0.7749419953596288}, 'f1': {'supports': 0.913128355295266, 'contradicts': 0.6163021868787277, 'parts_of_same': 0.7463687150837989}, 'support': {'supports': 2058, 'contradicts': 259, 'parts_of_same': 431}, 'micro_avg': {'precision': 0.858806404657933, 'recall': 0.858806404657933, 'f1': 0.858806404657933, 'support': None}, 'macro_avg': {'precision': 0.7574101168637796, 'recall': 0.7608442254732326, 'f1': 0.7585997524192641, 'support': None}, 'weighted_avg': {'precision': 0.859637264086308, 'recall': 0.858806404657933, 'f1': 0.8589975756187647, 'support': None}}
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0286e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8653e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9602e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6507e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8792e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6273e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6655e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5253e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9772e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2586e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7355e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8224e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1447e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4688e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8525e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2220e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2816e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7024e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9010e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2697e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9443e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6037e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4534e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9772e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7721e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7430e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8573e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7792e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3130e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3266e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4043e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0070e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2229e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2136e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9050e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9271e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0372e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7602e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4088e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1516e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2152e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1688e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9920e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8666e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0586e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9474e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8092e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2224e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5257e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1774e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2714e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0984e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3032e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4878e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4203e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9686e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1063e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0145e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1862e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7266e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2776e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1767e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8498e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8273e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5439e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3772e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2474e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4092e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0860e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4024e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8803e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7050e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5801e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2587e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0792e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3492e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3953e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0461e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6163e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7569e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9849e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5258e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7512e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5430e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9116e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0368e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9450e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4825e-06, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 18---------------
Evaluating
				 {'precision': {'supports': 0.9162585700293829, 'contradicts': 0.6311475409836066, 'parts_of_same': 0.7207792207792207}, 'recall': {'supports': 0.9091350826044704, 'contradicts': 0.5945945945945946, 'parts_of_same': 0.7726218097447796}, 'f1': {'supports': 0.9126829268292684, 'contradicts': 0.6123260437375746, 'parts_of_same': 0.7458006718924972}, 'support': {'supports': 2058, 'contradicts': 259, 'parts_of_same': 431}, 'micro_avg': {'precision': 0.8580786026200873, 'recall': 0.8580786026200873, 'f1': 0.8580786026200873, 'support': None}, 'macro_avg': {'precision': 0.7560617772640702, 'recall': 0.7587838289812816, 'f1': 0.7569365474864468, 'support': None}, 'weighted_avg': {'precision': 0.8587275088759346, 'recall': 0.8580786026200873, 'f1': 0.8582001449520861, 'support': None}}
Loss: tensor(6.4898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5774e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1856e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5565e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9125e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5562e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0476e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6944e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6794e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5322e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1368e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3946e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2258e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9512e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5781e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0145e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5982e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7026e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7862e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7125e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8105e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3311e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7203e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9554e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8693e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2626e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5132e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5949e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6931e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0913e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2768e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6858e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6368e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8997e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4163e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0578e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2211e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4436e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0289e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5275e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5450e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0180e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0944e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1863e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1774e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0995e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2770e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7172e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8152e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6805e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8310e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4896e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9441e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5439e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6211e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8697e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2573e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1887e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9953e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0598e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0821e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4165e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8057e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1401e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8714e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0953e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6163e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9913e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8244e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4129e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1315e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5825e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8224e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8512e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3624e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9443e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8467e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4896e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7624e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3260e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8823e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4353e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1858e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1134e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5761e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5403e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3487e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2037e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8154e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6099e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3492e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7743e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9491e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1638e-06, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 19---------------
Evaluating
				 {'precision': {'supports': 0.9162995594713657, 'contradicts': 0.6311475409836066, 'parts_of_same': 0.7223427331887202}, 'recall': {'supports': 0.9096209912536443, 'contradicts': 0.5945945945945946, 'parts_of_same': 0.7726218097447796}, 'f1': {'supports': 0.9129480614484271, 'contradicts': 0.6123260437375746, 'parts_of_same': 0.7466367713004484}, 'support': {'supports': 2058, 'contradicts': 259, 'parts_of_same': 431}, 'micro_avg': {'precision': 0.8584425036390102, 'recall': 0.8584425036390102, 'f1': 0.8584425036390102, 'support': None}, 'macro_avg': {'precision': 0.7565966112145642, 'recall': 0.7589457985310061, 'f1': 0.7573036254954834, 'support': None}, 'weighted_avg': {'precision': 0.859003429589215, 'recall': 0.8584425036390102, 'f1': 0.8585298414189912, 'support': None}}
Loss: tensor(2.4160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3472e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9916e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5375e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8569e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0640e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3955e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5156e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5487e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9410e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9055e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6686e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0366e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8516e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3653e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5238e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5697e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5529e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4032e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3586e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7675e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8898e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4255e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8472e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2862e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2127e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2768e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8017e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4172e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7205e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0452e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9783e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8304e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2225e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3379e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6887e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6869e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5977e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9441e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7483e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3527e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8916e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5406e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7390e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8176e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0015e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8264e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8441e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5569e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8116e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4896e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9275e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1397e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4310e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1862e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6602e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0500e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7803e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1465e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5443e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6026e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2024e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6174e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2315e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6847e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4520e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5225e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0648e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4370e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2767e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7200e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2044e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8211e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1262e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8244e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7593e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4697e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6022e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6931e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0289e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2598e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7759e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0112e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5920e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7006e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8077e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1048e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2622e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0869e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3730e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7796e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1578e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1509e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6423e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8061e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3394e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7125e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6997e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2701e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7920e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1405e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1863e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3130e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9419e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8904e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0203e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7969e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3955e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5352e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1384e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2406e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1849e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3871e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8591e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5293e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8121e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2046e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2408e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9898e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7862e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6273e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7849e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1028e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2631e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0507e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3922e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9655e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2858e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8962e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7319e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7536e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6255e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1743e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8143e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0821e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0216e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 20---------------
Evaluating
				 {'precision': {'supports': 0.9162995594713657, 'contradicts': 0.6337448559670782, 'parts_of_same': 0.7229437229437229}, 'recall': {'supports': 0.9096209912536443, 'contradicts': 0.5945945945945946, 'parts_of_same': 0.7749419953596288}, 'f1': {'supports': 0.9129480614484271, 'contradicts': 0.6135458167330677, 'parts_of_same': 0.748040313549832}, 'support': {'supports': 2058, 'contradicts': 259, 'parts_of_same': 431}, 'micro_avg': {'precision': 0.858806404657933, 'recall': 0.858806404657933, 'f1': 0.858806404657933, 'support': None}, 'macro_avg': {'precision': 0.7576627127940556, 'recall': 0.7597191937359559, 'f1': 0.7581780639104423, 'support': None}, 'weighted_avg': {'precision': 0.8593424875095664, 'recall': 0.858806404657933, 'f1': 0.8588649389136482, 'support': None}}
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8889e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7746e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0289e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2074e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5209e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1920e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6476e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8489e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5447e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7809e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0644e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8452e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0441e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0320e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8251e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1675e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6138e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2816e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1320e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7865e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0171e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6207e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9010e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7827e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9735e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7209e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7066e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8735e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6489e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5562e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7969e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7869e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1320e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7059e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9072e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6180e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7825e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1878e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3452e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2587e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2088e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4896e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5022e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5443e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6379e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2708e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4746e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3503e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6551e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5209e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4670e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7430e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0436e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3631e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1375e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6198e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6807e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3213e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7304e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6582e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0390e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8152e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2392e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2735e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4909e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4114e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8746e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7999e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3425e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0028e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1039e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6856e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9116e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7562e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2838e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2768e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4498e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0355e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9059e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8697e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5061e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5048e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5730e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3311e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1545e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0640e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0278e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2430e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4209e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8152e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0997e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8454e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8470e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5865e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6286e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6167e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9573e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8801e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9735e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8783e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5450e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3955e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7534e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0242e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7167e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3534e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6807e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8651e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7880e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9823e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6070e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8050e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6368e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1712e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6730e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7792e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4880e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0655e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2735e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8423e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8472e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6070e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7035e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2629e-06, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 21---------------
Evaluating
				 {'precision': {'supports': 0.9158924205378973, 'contradicts': 0.6337448559670782, 'parts_of_same': 0.7239130434782609}, 'recall': {'supports': 0.9101068999028182, 'contradicts': 0.5945945945945946, 'parts_of_same': 0.7726218097447796}, 'f1': {'supports': 0.9129904947599318, 'contradicts': 0.6135458167330677, 'parts_of_same': 0.7474747474747475}, 'support': {'supports': 2058, 'contradicts': 259, 'parts_of_same': 431}, 'micro_avg': {'precision': 0.858806404657933, 'recall': 0.858806404657933, 'f1': 0.858806404657933, 'support': None}, 'macro_avg': {'precision': 0.7578501066610789, 'recall': 0.7591077680807308, 'f1': 0.7580036863225823, 'support': None}, 'weighted_avg': {'precision': 0.8591896073149914, 'recall': 0.858806404657933, 'f1': 0.8588080134321034, 'support': None}}
Loss: tensor(3.0221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2024e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8227e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1512e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2533e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1412e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5088e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9103e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0423e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7628e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2858e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1050e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3366e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7509e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8714e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5394e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5227e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9525e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4723e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8472e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8586e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6203e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8346e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9920e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4035e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7893e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0236e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0271e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5571e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1273e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5017e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3397e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5966e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9112e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4180e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8467e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8719e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4982e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9677e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5112e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3010e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5664e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3063e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0825e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1375e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4255e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9284e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1262e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4670e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0644e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4699e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9209e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4452e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7516e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0459e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4324e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3176e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8154e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3169e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6046e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2342e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5697e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0882e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0931e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2525e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9035e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5242e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9573e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6421e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0470e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4129e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5681e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0158e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2145e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8379e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5041e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1761e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6320e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6026e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1690e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3066e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6163e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7381e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9646e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0470e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2406e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6022e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6384e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6646e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5439e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3474e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2339e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3384e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1984e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0507e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5902e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9865e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3765e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9450e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5350e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7017e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0704e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8333e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1384e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2043e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8653e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6026e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4353e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9909e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4180e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6121e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4896e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8527e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4969e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5143e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8512e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3962e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6017e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4467e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5496e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4136e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2046e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3730e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8957e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8935e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0533e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8648e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5384e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1556e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2686e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3304e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5684e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4342e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8922e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6070e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8472e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8483e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8580e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0776e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3244e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7313e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9103e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9602e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5284e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8895e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9534e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9167e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9862e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2227e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5222e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8673e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9154e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 22---------------
Evaluating
				 {'precision': {'supports': 0.91552734375, 'contradicts': 0.6348547717842323, 'parts_of_same': 0.7254901960784313}, 'recall': {'supports': 0.9110787172011662, 'contradicts': 0.5907335907335908, 'parts_of_same': 0.7726218097447796}, 'f1': {'supports': 0.9132976132489039, 'contradicts': 0.6120000000000001, 'parts_of_same': 0.748314606741573}, 'support': {'supports': 2058, 'contradicts': 259, 'parts_of_same': 431}, 'micro_avg': {'precision': 0.8591703056768559, 'recall': 0.8591703056768559, 'f1': 0.8591703056768558, 'support': None}, 'macro_avg': {'precision': 0.758624103870888, 'recall': 0.7581447058931788, 'f1': 0.7578707399968256, 'support': None}, 'weighted_avg': {'precision': 0.8592681709750436, 'recall': 0.8591703056768559, 'f1': 0.8590240478791348, 'support': None}}
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5783e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2498e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5352e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6203e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7357e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3013e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3275e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7185e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3041e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2101e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5048e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6887e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9759e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6289e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3547e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6154e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7935e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5538e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9602e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5346e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3238e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5216e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9308e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6792e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3538e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1803e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1582e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6878e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9580e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1375e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7792e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6704e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5322e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8324e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1931e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4832e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9421e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0315e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6130e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2695e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5697e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2891e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3022e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8922e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8869e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6602e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4578e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9953e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0127e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7889e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8110e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3927e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5209e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9165e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2598e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4534e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7244e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5483e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4249e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1103e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8017e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6589e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1863e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6816e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1803e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8973e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1441e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3909e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2302e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1447e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7973e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2779e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0770e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2072e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5684e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3447e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8512e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5258e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5269e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4022e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7447e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0028e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8878e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6706e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7602e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7946e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2721e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2207e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6213e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2701e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4518e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9123e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6525e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4995e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4284e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7571e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5061e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6589e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2123e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1112e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2540e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1977e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4255e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5704e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0436e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8776e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9666e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8516e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5600e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2587e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1350e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9712e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6944e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5308e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3869e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4317e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0104e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8646e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6904e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9384e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4417e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3715e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5439e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4216e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6273e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4774e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4823e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6723e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1503e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0686e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0255e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8205e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2735e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6904e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6589e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4754e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3412e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9282e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5165e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3781e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9803e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1690e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5512e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9767e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5589e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3388e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6838e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5310e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3005e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 23---------------
Evaluating
				 {'precision': {'supports': 0.91552734375, 'contradicts': 0.6348547717842323, 'parts_of_same': 0.7254901960784313}, 'recall': {'supports': 0.9110787172011662, 'contradicts': 0.5907335907335908, 'parts_of_same': 0.7726218097447796}, 'f1': {'supports': 0.9132976132489039, 'contradicts': 0.6120000000000001, 'parts_of_same': 0.748314606741573}, 'support': {'supports': 2058, 'contradicts': 259, 'parts_of_same': 431}, 'micro_avg': {'precision': 0.8591703056768559, 'recall': 0.8591703056768559, 'f1': 0.8591703056768558, 'support': None}, 'macro_avg': {'precision': 0.758624103870888, 'recall': 0.7581447058931788, 'f1': 0.7578707399968256, 'support': None}, 'weighted_avg': {'precision': 0.8592681709750436, 'recall': 0.8591703056768559, 'f1': 0.8590240478791348, 'support': None}}
Loss: tensor(5.1943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5447e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7803e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2339e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9666e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9403e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8741e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6470e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1039e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8024e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4432e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4651e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3319e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0143e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1035e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5697e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0821e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1026e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1726e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4940e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8286e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9123e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6723e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0445e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1384e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6403e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3278e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5308e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5821e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5651e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6538e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4439e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4953e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7770e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8205e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1313e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8492e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3017e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4050e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1237e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0869e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9927e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0761e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6904e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3138e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2406e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2218e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9225e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4397e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2527e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0015e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8794e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9684e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0423e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4653e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3975e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0785e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0015e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6408e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2876e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4973e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8693e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2255e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4236e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4498e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6533e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2675e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2832e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4050e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2269e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4262e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1432e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6273e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8213e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3714e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9752e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6878e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6147e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8492e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0264e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6417e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5063e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2770e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2598e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0289e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9408e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7538e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3615e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0869e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4317e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9019e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6750e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1507e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0483e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9169e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1019e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1461e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7472e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9143e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1397e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2776e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5891e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0476e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4394e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3752e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9465e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6242e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4860e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2152e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9008e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9759e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0242e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5953e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1887e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1266e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4507e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6147e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6169e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2730e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1213e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9551e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3048e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6163e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9421e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5878e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7209e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3854e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1405e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2304e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7761e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2622e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9622e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0278e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9950e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8017e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5640e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9262e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0436e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0595e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8339e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1635e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0423e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5909e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3200e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6361e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1461e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9185e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5229e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1615e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5311e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9030e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5127e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3432e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2167e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6328e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9172e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5282e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9022e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5489e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3085e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8827e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5571e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4869e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0357e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1163e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6657e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6860e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0278e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5258e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 24---------------
Evaluating
				 {'precision': {'supports': 0.915609756097561, 'contradicts': 0.6375, 'parts_of_same': 0.7270742358078602}, 'recall': {'supports': 0.9120505344995141, 'contradicts': 0.5907335907335908, 'parts_of_same': 0.7726218097447796}, 'f1': {'supports': 0.9138266796494644, 'contradicts': 0.6132264529058116, 'parts_of_same': 0.749156355455568}, 'support': {'supports': 2058, 'contradicts': 259, 'parts_of_same': 431}, 'micro_avg': {'precision': 0.8598981077147017, 'recall': 0.8598981077147017, 'f1': 0.8598981077147015, 'support': None}, 'macro_avg': {'precision': 0.7600613306351405, 'recall': 0.7584686449926282, 'f1': 0.7587364960036146, 'support': None}, 'weighted_avg': {'precision': 0.8598276469002797, 'recall': 0.8598981077147017, 'f1': 0.8596678847243642, 'support': None}}
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8904e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0233e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6779e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3940e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4518e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6046e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5436e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7125e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3158e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7209e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9384e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5582e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9384e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7628e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5454e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3675e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3570e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0289e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0872e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4224e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5141e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0165e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9962e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5024e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6315e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6644e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7768e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2514e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3990e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9878e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4816e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1414e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9169e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1774e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6708e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0907e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5209e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0821e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0556e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9059e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8741e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7666e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6066e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4507e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9916e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0050e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5509e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9918e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0622e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7587e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1320e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1262e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0785e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6046e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3743e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4805e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7849e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7216e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4167e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1372e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1328e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3238e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6931e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3697e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6648e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5459e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9712e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2275e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1690e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0628e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1816e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0381e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2352e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3908e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2527e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4520e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8895e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9783e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4485e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3862e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3924e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3827e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3960e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1147e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9004e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1531e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9189e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9465e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3381e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1803e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2520e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7540e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5452e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8017e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6024e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7856e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6666e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8470e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1352e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4249e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1328e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7768e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3962e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5865e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2847e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5154e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7924e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5125e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3512e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6677e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7507e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8024e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6569e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7719e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5328e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0644e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7715e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1907e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6677e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2145e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4858e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9257e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6145e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4880e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8284e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8152e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9904e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8412e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0785e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8527e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8467e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0284e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2169e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0918e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5951e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7869e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2646e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9203e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4918e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4686e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3969e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1569e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0966e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7944e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7507e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7944e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7094e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4231e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1615e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0695e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5805e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4439e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2988e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6161e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7319e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4392e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4754e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5823e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3812e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7006e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7944e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9329e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3492e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2158e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5048e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8708e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7640e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5127e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0637e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6158e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8774e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3635e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1512e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4258e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5688e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4417e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6249e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7582e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9015e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0242e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4651e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2991e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2615e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8465e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3432e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9088e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7529e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1147e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0918e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6394e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7392e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2052e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3770e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9869e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8849e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4231e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2525e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9368e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0019e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7317e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9950e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5129e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2317e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6041e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5167e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8015e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1072e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7266e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4242e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9178e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5772e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6203e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5108e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1918e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6059e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7587e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1997e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2492e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1863e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2313e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0085e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3794e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 25---------------
Evaluating
				 {'precision': {'supports': 0.915609756097561, 'contradicts': 0.6375, 'parts_of_same': 0.7270742358078602}, 'recall': {'supports': 0.9120505344995141, 'contradicts': 0.5907335907335908, 'parts_of_same': 0.7726218097447796}, 'f1': {'supports': 0.9138266796494644, 'contradicts': 0.6132264529058116, 'parts_of_same': 0.749156355455568}, 'support': {'supports': 2058, 'contradicts': 259, 'parts_of_same': 431}, 'micro_avg': {'precision': 0.8598981077147017, 'recall': 0.8598981077147017, 'f1': 0.8598981077147015, 'support': None}, 'macro_avg': {'precision': 0.7600613306351405, 'recall': 0.7584686449926282, 'f1': 0.7587364960036146, 'support': None}, 'weighted_avg': {'precision': 0.8598276469002797, 'recall': 0.8598981077147017, 'f1': 0.8596678847243642, 'support': None}}
Loss: tensor(4.1501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8322e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3673e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0805e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0061e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1940e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2257e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5704e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7796e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6361e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8735e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2324e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0966e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5677e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1913e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1750e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2304e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3384e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8774e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6565e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2114e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4236e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3238e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4432e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7969e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8538e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1443e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1500e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7924e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8922e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1138e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2783e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7266e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1644e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3545e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9516e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8973e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6538e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0999e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5845e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2812e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4880e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9044e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9092e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1760e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9384e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7328e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3882e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0593e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1622e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3253e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8284e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0624e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9017e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8284e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4677e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5905e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8352e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4180e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2258e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6542e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4772e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7754e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3070e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5116e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2990e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5198e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5491e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6496e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1324e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1962e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7955e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6542e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8714e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4450e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2039e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9554e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1624e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6050e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5697e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7450e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7044e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2525e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7666e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2439e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9427e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9942e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0220e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7617e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3716e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4136e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9551e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4249e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4715e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0194e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9551e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5885e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8171e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2077e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2145e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4236e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5931e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3047e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9556e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7231e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7433e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6329e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8719e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0918e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5865e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5615e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7741e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0348e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7587e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8776e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1072e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0348e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1092e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1273e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6145e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0719e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3774e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4077e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8783e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6498e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9194e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3231e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1004e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7035e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3474e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5719e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0242e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2730e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3185e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7809e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0962e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5289e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0443e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7580e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6854e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8869e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3331e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0785e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5048e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7489e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8895e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8646e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0050e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7211e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3651e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3057e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5615e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5516e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1760e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0640e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2152e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9035e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7750e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9155e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8088e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1273e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9796e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6807e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6484e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9922e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3172e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5127e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9646e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8670e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7035e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3520e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7697e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0085e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4074e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6154e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3996e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4143e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6598e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3236e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7900e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5380e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3222e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2165e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8139e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8662e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2253e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7425e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8421e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5229e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1132e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2595e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8854e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2695e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0099e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5478e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7617e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9891e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4856e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0399e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7381e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0288e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4019e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8382e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1419e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0447e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2152e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8854e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4765e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9313e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3615e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6673e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4430e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0899e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3339e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7406e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1500e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2529e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5489e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6145e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4063e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9227e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3459e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5048e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1863e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3821e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4145e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0754e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5604e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2401e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7642e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3386e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0145e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2121e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1441e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5147e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9851e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0593e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2695e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2525e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6498e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6598e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7132e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0196e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7063e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8942e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6317e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3238e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8655e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3238e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1760e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0549e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 26---------------
Evaluating
				 {'precision': {'supports': 0.9142717973697029, 'contradicts': 0.6359832635983264, 'parts_of_same': 0.7280701754385965}, 'recall': {'supports': 0.9120505344995141, 'contradicts': 0.5868725868725869, 'parts_of_same': 0.7703016241299304}, 'f1': {'supports': 0.9131598151301387, 'contradicts': 0.6104417670682731, 'parts_of_same': 0.7485907553551296}, 'support': {'supports': 2058, 'contradicts': 259, 'parts_of_same': 431}, 'micro_avg': {'precision': 0.8591703056768559, 'recall': 0.8591703056768559, 'f1': 0.8591703056768558, 'support': None}, 'macro_avg': {'precision': 0.7594417454688752, 'recall': 0.7564082485006772, 'f1': 0.7573974458511805, 'support': None}, 'weighted_avg': {'precision': 0.8588388900556224, 'recall': 0.8591703056768559, 'f1': 0.8588172972221867, 'support': None}}
Loss: tensor(7.4940e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6227e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1167e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1593e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6022e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0384e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8399e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5818e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8748e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9542e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6889e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0730e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9257e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8714e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6055e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8264e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5818e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6317e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0339e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8863e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0006e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5633e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0438e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0918e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8646e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0242e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5999e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3050e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7922e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2072e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1876e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2333e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2333e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3916e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7190e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8448e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2152e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5443e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6180e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2044e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7763e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5730e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9950e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4765e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8017e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6704e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0249e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5410e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1022e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3593e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4203e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3324e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8147e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2297e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0695e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4216e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8414e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6904e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1712e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1264e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4721e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2781e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6329e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9350e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7125e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2253e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6863e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4156e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0913e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2709e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1514e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0136e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8106e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9902e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6156e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6673e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8533e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6807e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1531e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2688e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4108e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5342e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0450e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1079e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1534e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2401e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5342e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4505e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9885e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5380e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3311e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7461e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8662e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3570e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3500e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9315e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6361e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0275e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5439e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1542e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3570e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3527e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3220e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3545e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1951e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8130e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2174e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8286e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8105e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1441e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4565e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9551e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7547e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6723e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9178e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3386e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2406e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4227e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5262e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5209e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0899e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1237e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9969e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7955e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1273e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6319e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3668e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0074e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1628e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7191e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0827e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2695e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8205e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5604e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8331e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0375e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3812e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0832e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5048e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8249e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1010e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5489e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5238e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4545e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1461e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3343e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3898e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2461e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5538e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3047e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4746e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8849e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5308e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9350e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5315e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0121e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1053e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2238e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5470e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7741e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3882e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9189e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3070e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2485e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3297e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4674e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2333e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0737e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0331e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9569e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7922e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6637e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1421e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4686e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5633e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5999e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7190e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4211e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6863e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9853e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5807e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6882e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4721e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3125e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6794e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4293e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5708e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9699e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3955e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9670e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5818e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6854e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4355e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2186e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1746e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3057e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2582e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2514e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8668e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8211e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9655e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0556e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0715e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6361e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1871e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0558e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0545e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5545e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6329e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2253e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3297e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8611e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7617e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0715e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1505e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1253e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7430e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4633e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7011e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8382e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7529e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3781e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5041e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8436e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3425e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9388e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7352e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0375e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0311e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1825e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7326e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6565e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3908e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8478e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6039e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3554e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4699e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7094e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1101e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5461e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8352e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7050e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0288e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3487e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3052e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1231e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8139e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6158e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0899e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2238e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3832e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2675e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6329e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9723e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5284e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4573e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2573e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8258e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2152e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9427e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1167e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9853e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4519e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7781e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5108e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8664e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1454e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1397e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5818e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5251e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7236e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6492e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1269e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0737e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8536e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2339e-06, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 27---------------
Evaluating
				 {'precision': {'supports': 0.9138686131386862, 'contradicts': 0.6359832635983264, 'parts_of_same': 0.7290748898678414}, 'recall': {'supports': 0.9125364431486881, 'contradicts': 0.5868725868725869, 'parts_of_same': 0.7679814385150812}, 'f1': {'supports': 0.9132020423048871, 'contradicts': 0.6104417670682731, 'parts_of_same': 0.7480225988700565}, 'support': {'supports': 2058, 'contradicts': 259, 'parts_of_same': 431}, 'micro_avg': {'precision': 0.8591703056768559, 'recall': 0.8591703056768559, 'f1': 0.8591703056768558, 'support': None}, 'macro_avg': {'precision': 0.7596422555349513, 'recall': 0.755796822845452, 'f1': 0.7572221360810723, 'support': None}, 'weighted_avg': {'precision': 0.858694522796369, 'recall': 0.8591703056768559, 'f1': 0.8587598110797433, 'support': None}}
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4222e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9348e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7859e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3891e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5127e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4586e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7944e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4953e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2178e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4519e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0194e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2812e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0262e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1048e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3198e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6542e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9055e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2006e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7617e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5719e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4708e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4068e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8904e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2186e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9000e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8139e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9871e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3231e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7190e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2642e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1984e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9856e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0737e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6152e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2709e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4946e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0651e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2709e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3996e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5127e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6572e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0262e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3565e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2695e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2812e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1019e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4492e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4851e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4519e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5624e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9000e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5242e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1092e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2085e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5957e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9022e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8693e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6677e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5860e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5026e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3344e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3116e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0194e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3668e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2514e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8467e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1863e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6112e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6520e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3488e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0737e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6319e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0019e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6852e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6595e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6066e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3289e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1496e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3677e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1019e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7236e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6572e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2333e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0772e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8904e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3849e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8545e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1237e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6542e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7498e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5807e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2483e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6572e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2536e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3975e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2763e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2186e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9331e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3545e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0376e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3432e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9427e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0192e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2186e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8735e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4247e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5562e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7322e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2072e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9123e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6960e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2352e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2958e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2392e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5061e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1421e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7540e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6602e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5380e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9750e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7094e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8533e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2269e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6396e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8860e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9741e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1238e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3138e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5860e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4459e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1576e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0094e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0264e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6310e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9397e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1079e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9853e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4180e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0379e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9688e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8924e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8139e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5794e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8264e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2525e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1099e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8139e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5637e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8807e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3474e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9030e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3600e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0805e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4403e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8139e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6622e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8352e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3231e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5684e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6854e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3189e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6417e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7741e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9000e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0430e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8139e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3125e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1017e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1008e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7224e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5380e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4765e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0257e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9766e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9231e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9472e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3812e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9008e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6145e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5041e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9189e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7447e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1461e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5331e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2211e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4807e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0805e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3882e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5059e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5180e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4519e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2098e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4586e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6527e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6207e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5637e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0375e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4474e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5070e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0818e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3719e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8284e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5240e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3962e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7085e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4180e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0624e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0664e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5052e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5041e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2348e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3278e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8058e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6145e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7768e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4556e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8264e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1209e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8662e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8668e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1260e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2951e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8827e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4505e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0194e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1765e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2598e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5984e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2346e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3138e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1496e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0465e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0640e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2525e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3070e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7094e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5342e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9000e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5310e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7696e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9008e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8382e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2132e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3076e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9408e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8805e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7073e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6770e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6057e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5425e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7935e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8294e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2646e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5079e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4077e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4674e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4313e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8662e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4519e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7944e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0827e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5297e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5233e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0619e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2818e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9313e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6708e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3191e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7190e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2311e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6022e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4335e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8308e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9243e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3908e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4762e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5487e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8580e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3849e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2902e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2554e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1388e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1760e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9370e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7529e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0194e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2505e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6329e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0501e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2512e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3290e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3138e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4211e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8646e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7094e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2429e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3668e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0399e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0627e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4946e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5637e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2735e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5127e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8352e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2450e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0066e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3047e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2028e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3432e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8028e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9427e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6227e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6893e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5375e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 28---------------
Evaluating
				 {'precision': {'supports': 0.9138686131386862, 'contradicts': 0.6359832635983264, 'parts_of_same': 0.7290748898678414}, 'recall': {'supports': 0.9125364431486881, 'contradicts': 0.5868725868725869, 'parts_of_same': 0.7679814385150812}, 'f1': {'supports': 0.9132020423048871, 'contradicts': 0.6104417670682731, 'parts_of_same': 0.7480225988700565}, 'support': {'supports': 2058, 'contradicts': 259, 'parts_of_same': 431}, 'micro_avg': {'precision': 0.8591703056768559, 'recall': 0.8591703056768559, 'f1': 0.8591703056768558, 'support': None}, 'macro_avg': {'precision': 0.7596422555349513, 'recall': 0.755796822845452, 'f1': 0.7572221360810723, 'support': None}, 'weighted_avg': {'precision': 0.858694522796369, 'recall': 0.8591703056768559, 'f1': 0.8587598110797433, 'support': None}}
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0600e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5571e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7334e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3677e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9940e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5443e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3244e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1236e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1372e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5041e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0593e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6145e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6138e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0953e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5414e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4366e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1361e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0013e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2709e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4574e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6572e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1141e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9653e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9554e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8079e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6329e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5070e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2002e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2333e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0619e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7859e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0284e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0104e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3459e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8233e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2083e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9472e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2573e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8483e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8472e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4946e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7936e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1458e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8139e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0715e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1167e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8304e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7161e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1280e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0074e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8662e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0180e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5819e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9156e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3996e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4674e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0192e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6589e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2995e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2066e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7030e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0962e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8227e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8817e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6156e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7313e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6329e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2368e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8556e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3353e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9353e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4762e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1245e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4858e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4194e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6410e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7922e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4699e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4960e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1529e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2573e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4490e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3554e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3693e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8485e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7754e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4737e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6138e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1441e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6329e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1315e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5061e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3996e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8512e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3725e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5048e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7094e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8662e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2889e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4324e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3311e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4765e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5372e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1664e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4346e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8649e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9322e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3962e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7337e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9950e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1079e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3916e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8320e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1143e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0911e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5719e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6852e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9582e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1441e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6384e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6852e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2629e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8827e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4896e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0549e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6057e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5410e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9180e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0715e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4266e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8465e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1990e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0278e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3812e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3231e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3887e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4357e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6361e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0800e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5308e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1797e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1079e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8189e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1505e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3129e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3781e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2951e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0288e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3116e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2186e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2098e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0715e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6852e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1099e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0264e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3796e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6953e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7379e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6158e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8668e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0770e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6315e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1914e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9918e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9132e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1914e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4880e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3996e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3570e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7529e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8545e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4519e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7190e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1695e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8357e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7617e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0737e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4507e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7401e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1099e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9178e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7768e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7207e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5310e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8441e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6863e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7750e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0785e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5719e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3668e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6572e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6329e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2341e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8286e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2770e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7763e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1348e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8827e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5127e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3297e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7190e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5052e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2682e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2525e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5423e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9331e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9507e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2927e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4505e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3231e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3996e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2863e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9950e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1237e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7617e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6049e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8662e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5807e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8198e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5041e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3474e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2430e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6145e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3478e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2429e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1816e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5388e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3231e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0459e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5284e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9611e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3803e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3781e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5061e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3474e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5439e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4962e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2775e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2876e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6598e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9370e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2907e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5668e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2735e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0854e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9188e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7094e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1664e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0899e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4935e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3803e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2253e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5017e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4211e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2827e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6145e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4030e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4858e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5876e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8445e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9088e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6145e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9950e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3695e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4527e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0104e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3441e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5489e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9562e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2152e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4703e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4586e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5070e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5768e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3962e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1138e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9611e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3474e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7216e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3088e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4465e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4518e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9950e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2186e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5405e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6388e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9657e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5048e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2709e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0255e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8103e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5284e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9331e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2620e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8566e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8125e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5586e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7990e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2158e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3419e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3996e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3781e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0624e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8904e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9611e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6862e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4180e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9441e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0194e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0957e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3794e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7322e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8566e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9624e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2429e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5432e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9000e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3269e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6156e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1684e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2434e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4335e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7607e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3629e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1421e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8139e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5143e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2002e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2437e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3975e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8273e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9957e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9088e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2186e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7414e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2842e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9427e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4556e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3441e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4916e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5161e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2695e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8103e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0104e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4665e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9880e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0376e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8328e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6156e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1134e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3459e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1099e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6055e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9427e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9144e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5637e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6668e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2414e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6057e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9582e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3747e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6145e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4233e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9243e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3264e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9957e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9331e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0293e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3264e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 29---------------
Evaluating
				 {'precision': {'supports': 0.9138266796494645, 'contradicts': 0.6359832635983264, 'parts_of_same': 0.7274725274725274}, 'recall': {'supports': 0.9120505344995141, 'contradicts': 0.5868725868725869, 'parts_of_same': 0.7679814385150812}, 'f1': {'supports': 0.9129377431906615, 'contradicts': 0.6104417670682731, 'parts_of_same': 0.7471783295711062}, 'support': {'supports': 2058, 'contradicts': 259, 'parts_of_same': 431}, 'micro_avg': {'precision': 0.858806404657933, 'recall': 0.858806404657933, 'f1': 0.858806404657933, 'support': None}, 'macro_avg': {'precision': 0.7590941569067727, 'recall': 0.7556348532957274, 'f1': 0.7568526132766803, 'support': None}, 'weighted_avg': {'precision': 0.8584118017944773, 'recall': 0.858806404657933, 'f1': 0.8584294589527695, 'support': None}}
Loss: tensor(2.8964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5041e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9043e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7094e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2040e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3725e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6858e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2735e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4417e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8817e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8845e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4346e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7571e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4880e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8933e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1441e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9766e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7617e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1350e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4858e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5275e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4710e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1269e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5794e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9463e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3860e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2072e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1085e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2545e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0545e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1269e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6572e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7962e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8479e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1181e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7345e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2072e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8139e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5772e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3887e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8714e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5052e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8904e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4640e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0375e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7772e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3474e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4927e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5284e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8284e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3474e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3474e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0899e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0556e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6310e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4151e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9088e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7085e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2545e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7094e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0715e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3412e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1997e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8662e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3695e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4346e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4573e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7582e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0194e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7560e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5278e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5052e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0642e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8964e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5719e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2002e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1480e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5405e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9853e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5984e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8817e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8382e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2735e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9147e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3996e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8478e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4703e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7902e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8382e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5284e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5807e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6554e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7896e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5961e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7684e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2788e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6145e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6849e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0965e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1141e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4762e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1141e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6147e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4247e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5043e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3047e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0288e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6814e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2002e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6102e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1066e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0192e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5623e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0381e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4247e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7929e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4765e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0129e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3231e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1141e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3474e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3984e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0772e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6329e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4703e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3057e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3812e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7617e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4703e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6854e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4244e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0637e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2876e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8566e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9000e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4055e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3459e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2098e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1079e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2253e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9331e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8139e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5253e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3202e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7044e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7712e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2709e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7902e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2359e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8465e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5807e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3679e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5410e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5041e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7902e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3004e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8633e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8024e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7220e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7771e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2709e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2695e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3253e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7859e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0529e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0470e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4276e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6093e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9350e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0039e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5821e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3351e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2754e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7190e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5132e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9678e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6668e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8239e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0081e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9243e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3290e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0194e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4335e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6822e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0376e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5774e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8294e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6822e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8969e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7094e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1461e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7521e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9008e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6055e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4684e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1876e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4584e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6708e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7521e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7433e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5224e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9853e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1615e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5043e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3794e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8264e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1088e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4862e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4090e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8782e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5818e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2220e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1730e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6644e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9000e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6484e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9657e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1678e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2098e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7414e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9670e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5687e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1141e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1914e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4048e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5615e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1053e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9189e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8483e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6739e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4357e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7521e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0375e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8382e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4519e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3158e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2186e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5100e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0288e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7044e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6972e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1664e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1026e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3487e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8286e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2072e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5308e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6756e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8817e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5441e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6644e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1053e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3805e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3231e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5886e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5284e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5966e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5978e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7877e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9853e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5810e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7088e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8310e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1379e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3977e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0619e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0376e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5999e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1324e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9902e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5711e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9331e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6066e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0821e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9580e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0808e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1871e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1664e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6145e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2186e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7094e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0066e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0619e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7549e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0899e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7521e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7765e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7345e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3706e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9853e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2927e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3551e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6346e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0556e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6233e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3474e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1392e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7571e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7763e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8904e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1506e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0619e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7006e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4518e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2709e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9088e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0134e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0998e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7684e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9496e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3176e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7721e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4945e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9147e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1247e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3794e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0108e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8110e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0556e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2002e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6248e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1760e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5070e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2735e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8566e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2186e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7030e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4239e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0619e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7337e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5154e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8646e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5380e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8382e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4615e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7859e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1760e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7521e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7937e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5586e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5284e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8382e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8666e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6910e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0965e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5127e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5041e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1348e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3507e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1927e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8468e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6282e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8662e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4357e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1421e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3474e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3794e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3432e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5660e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7044e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7741e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8436e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4180e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0556e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4765e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5841e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5342e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4708e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0013e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6889e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0376e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8827e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4777e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0965e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2709e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5637e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6067e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1664e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3658e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8478e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4867e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1971e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3908e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6165e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0986e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3613e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6291e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8043e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9331e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0556e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6756e-07, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 30---------------
Evaluating
				 {'precision': {'supports': 0.9134662129314536, 'contradicts': 0.6413502109704642, 'parts_of_same': 0.7268722466960352}, 'recall': {'supports': 0.913022351797862, 'contradicts': 0.5868725868725869, 'parts_of_same': 0.765661252900232}, 'f1': {'supports': 0.9132442284325637, 'contradicts': 0.6129032258064516, 'parts_of_same': 0.7457627118644068}, 'support': {'supports': 2058, 'contradicts': 259, 'parts_of_same': 431}, 'micro_avg': {'precision': 0.8591703056768559, 'recall': 0.8591703056768559, 'f1': 0.8591703056768558, 'support': None}, 'macro_avg': {'precision': 0.7605628901993177, 'recall': 0.7551853971902269, 'f1': 0.7573033887011406, 'support': None}, 'weighted_avg': {'precision': 0.8585535331805941, 'recall': 0.8591703056768559, 'f1': 0.8586689542982701, 'support': None}}
Loss: tensor(8.4610e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0194e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7024e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6668e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1088e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6492e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2452e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9950e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8139e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4703e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2951e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8286e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4151e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0592e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6282e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8331e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7094e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6066e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5596e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5405e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0194e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0376e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2333e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3708e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0411e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4598e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1053e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1141e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6852e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2429e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0715e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7702e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4981e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5284e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3600e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7765e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5807e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1648e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5873e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7433e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0013e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3244e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0192e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9007e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7771e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5308e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3812e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3803e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7628e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2925e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9325e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0715e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5623e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2098e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3759e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3708e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4251e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9868e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5127e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7433e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6329e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7859e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3135e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8205e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5342e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0455e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5224e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3273e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9670e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8103e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1480e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5623e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2429e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6582e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2052e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6791e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4703e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7859e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1066e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7586e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6883e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1237e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8198e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6695e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3996e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6779e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2459e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8139e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8286e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0049e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7955e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2525e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5527e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8436e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3996e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1496e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3450e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7426e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4518e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0376e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0953e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0192e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5961e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1478e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5452e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0447e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6329e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4534e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2331e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6022e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0037e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7617e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2951e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3474e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8092e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8382e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2429e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5785e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8206e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5041e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7721e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0057e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5162e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8206e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5070e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9611e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2072e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2429e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5423e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2615e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3244e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4765e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0105e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4143e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1684e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6048e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5535e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0013e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2688e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3894e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5586e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4708e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5117e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1514e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1609e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1079e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9838e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5489e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0913e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9155e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7617e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0619e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1829e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9853e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9088e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0899e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9611e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0531e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6822e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8566e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8662e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7006e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9492e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9152e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8566e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6910e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6521e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9670e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7911e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0192e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0013e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6856e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6849e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6145e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2348e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2216e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0918e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9088e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2764e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7433e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3812e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2186e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7940e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3373e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2863e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8454e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5342e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8566e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2626e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5284e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7521e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9560e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8043e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5138e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3860e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0531e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6249e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3658e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0491e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8337e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3658e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1141e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9331e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8298e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4075e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0376e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1105e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0899e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5940e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1064e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2627e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5818e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1384e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6306e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3290e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7750e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7902e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5380e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5557e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2709e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1141e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2183e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2591e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7962e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0515e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2145e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4762e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3849e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2876e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3047e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2525e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9859e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6734e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4674e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7595e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7521e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0512e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7567e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7154e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9427e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1664e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0619e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9121e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4703e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1478e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5705e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4858e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9088e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1664e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8437e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4519e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9257e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7763e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5224e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8721e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3563e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3238e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3290e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3622e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2951e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0551e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1900e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7521e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4946e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0523e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7911e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5796e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4762e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8904e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2525e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2364e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4335e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4239e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2320e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7088e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5589e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8744e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0622e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2863e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9950e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1949e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1480e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2876e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2767e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1141e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3287e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8286e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0335e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0004e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7767e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2429e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9243e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3554e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5524e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8721e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9766e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4222e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0924e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3658e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5586e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1480e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0957e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0715e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7094e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4799e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4598e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7741e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3794e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8294e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7190e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5153e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7337e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6165e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2429e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2253e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3269e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3975e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3474e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5138e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9611e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8566e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9731e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2429e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8827e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7386e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0096e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4699e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3202e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0013e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9853e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3843e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5874e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8206e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4247e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8954e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9853e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2494e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9331e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7521e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0899e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7125e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4233e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0428e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7617e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5527e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6476e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5342e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3474e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6429e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6227e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1141e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0187e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8436e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3357e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3658e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8645e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5079e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9853e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4172e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7094e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8646e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7955e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2152e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0443e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6340e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6320e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8721e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2830e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9234e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4665e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3474e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0715e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9427e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8895e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8464e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8286e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7192e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3441e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2889e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4256e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1891e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2402e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3205e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4306e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3658e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6509e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9178e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1066e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0601e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7754e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8805e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1297e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4724e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8989e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4732e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5961e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1459e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8284e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2863e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7838e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2002e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8283e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0194e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0924e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1713e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0600e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0717e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9550e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3658e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1392e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2253e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2152e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5043e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3474e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8043e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8636e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8102e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2408e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2346e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2097e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6734e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2253e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3668e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5043e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2709e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1237e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4858e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7278e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1575e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2863e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6836e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2755e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0376e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5456e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4218e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2514e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1790e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9670e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9993e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5677e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9648e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8150e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9377e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1816e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0509e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2817e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5807e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6028e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0924e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3231e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4519e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1547e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5167e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4980e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2253e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2048e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7153e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9331e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2362e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2863e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8114e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8826e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0773e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3170e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9331e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5041e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7088e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9805e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1066e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1458e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6977e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2951e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3445e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9912e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9853e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8465e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4180e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0288e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9369e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0194e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9532e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6282e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5380e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3657e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8043e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4394e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8662e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8816e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7712e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1664e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4858e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0510e-08, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3908e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6116e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6910e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7521e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6057e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8699e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8566e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7433e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3533e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4130e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5255e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9957e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5343e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6292e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2583e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8963e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0376e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4482e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4924e-07, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2496e-07, device='cuda:0', grad_fn=<DivBackward0>)


		-------------RUN 5-----------
			------------EPOCH 1---------------
Evaluating
				 {'precision': {'supports': 0.7468265162200282, 'contradicts': 0.09038461538461538, 'parts_of_same': 0.16972477064220184}, 'recall': {'supports': 0.47319034852546915, 'contradicts': 0.33451957295373663, 'parts_of_same': 0.18718381112984822}, 'f1': {'supports': 0.5793216630196937, 'contradicts': 0.14231642694928084, 'parts_of_same': 0.1780272654370489}, 'support': {'supports': 2238, 'contradicts': 281, 'parts_of_same': 593}, 'micro_avg': {'precision': 0.40616966580976865, 'recall': 0.40616966580976865, 'f1': 0.40616966580976865, 'support': None}, 'macro_avg': {'precision': 0.33564530074894844, 'recall': 0.33163124420301804, 'f1': 0.2998884518020078, 'support': None}, 'weighted_avg': {'precision': 0.5775843859943205, 'recall': 0.40616966580976865, 'f1': 0.4633942693492906, 'support': None}}
Loss: tensor(0.3505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2889, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3992, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3824, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3873, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3968, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1835, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3716, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0960, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2912, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1817, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2875, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2985, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2938, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7875, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2835, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2937, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2839, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2994, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4863, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3906, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2994, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3834, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4733, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5877, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7948, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1716, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9952, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8747, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8888, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4926, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7771, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1918, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5947, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4996, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1987, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2991, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2910, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5764, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2975, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7716, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1820, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4875, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0962, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2915, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2874, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0915, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2817, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5924, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2736, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9637, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0889, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0958, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0961, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2975, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4881, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0849, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3982, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2852, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2820, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2830, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8818, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3891, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1866, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2968, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1883, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6803, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0972, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2976, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3944, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3898, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2998, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5808, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5920, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7913, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1957, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2940, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0837, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7575, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3830, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1941, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4997, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3806, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0820, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6914, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3513, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0919, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7815, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6000, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5889, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4730, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0862, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2972, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1821, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0913, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1824, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7887, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2968, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1875, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4968, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1926, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1840, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5821, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4837, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1751, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0875, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5839, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2638, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4900, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2891, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3990, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1910, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2687, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9796, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1948, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3903, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3889, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3927, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2815, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0800, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9862, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0927, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1787, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4973, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0982, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1824, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2904, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0960, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1944, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5878, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0742, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0687, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7948, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3730, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0830, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1919, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6800, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2866, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6787, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3852, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2990, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1969, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4931, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3969, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2736, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1857, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9957, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1997, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3852, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2948, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1835, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3968, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1934, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3794, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3839, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2915, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0989, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1772, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1919, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1862, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1931, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6819, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3971, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1879, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1835, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1944, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8939, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1888, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2747, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3805, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3818, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0963, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2942, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2733, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1853, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0915, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0999, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6730, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0837, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1958, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1936, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3956, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8910, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0931, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2927, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2957, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2951, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2071, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 2---------------
Evaluating
				 {'precision': {'supports': 0.9088524590163934, 'contradicts': 0.25579053373615307, 'parts_of_same': 0.6094276094276094}, 'recall': {'supports': 0.6193029490616622, 'contradicts': 0.9039145907473309, 'parts_of_same': 0.6104553119730185}, 'f1': {'supports': 0.7366462928514482, 'contradicts': 0.3987441130298273, 'parts_of_same': 0.6099410278011794}, 'support': {'supports': 2238, 'contradicts': 281, 'parts_of_same': 593}, 'micro_avg': {'precision': 0.6433161953727506, 'recall': 0.6433161953727506, 'f1': 0.6433161953727506, 'support': None}, 'macro_avg': {'precision': 0.5913568673933853, 'recall': 0.7112242839273373, 'f1': 0.5817771445608183, 'support': None}, 'weighted_avg': {'precision': 0.7928276078564009, 'recall': 0.6433161953727506, 'f1': 0.6819911724450585, 'support': None}}
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3879, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1957, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1873, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1917, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2960, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0944, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1839, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0808, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0883, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3739, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2917, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7835, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2967, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2973, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0923, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3958, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0733, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0906, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4981, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0981, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6747, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1875, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0881, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1889, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2909, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2981, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5803, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2993, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1908, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2693, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0796, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1753, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0736, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0986, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2965, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0961, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2853, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6948, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1918, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0961, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0771, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0888, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0818, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1940, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1793, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0926, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1575, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6996, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2896, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6839, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3891, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1946, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0936, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8994, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0981, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3939, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0948, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2958, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2687, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2848, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2815, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2853, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1951, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1917, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3914, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0958, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5913, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3840, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1927, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3910, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1867, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4883, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2918, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3881, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3739, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1971, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2830, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2996, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0991, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0947, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0708, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0938, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1887, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2903, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6925, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4730, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0947, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3926, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0912, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1690, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0834, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2815, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1700, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3789, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0867, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4891, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0997, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0951, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1837, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0917, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0883, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0965, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0980, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0982, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6835, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1742, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3999, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2817, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2968, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3945, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1805, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2819, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5752, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1803, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0862, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2889, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0730, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6957, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0459, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8909, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1953, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8906, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0782, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0821, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2898, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1834, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4944, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8914, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1000, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1875, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0930, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0741, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1698, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2897, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1959, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1924, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5930, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2915, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1857, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0883, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1784, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0898, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2927, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1834, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1898, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0789, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1887, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0994, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0891, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1908, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8737, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0938, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1824, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0796, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0411, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 3---------------
Evaluating
				 {'precision': {'supports': 0.9296875, 'contradicts': 0.303595206391478, 'parts_of_same': 0.4700944386149003}, 'recall': {'supports': 0.5848972296693477, 'contradicts': 0.8113879003558719, 'parts_of_same': 0.7554806070826307}, 'f1': {'supports': 0.7180471749862863, 'contradicts': 0.4418604651162791, 'parts_of_same': 0.5795601552393272}, 'support': {'supports': 2238, 'contradicts': 281, 'parts_of_same': 593}, 'micro_avg': {'precision': 0.637853470437018, 'recall': 0.637853470437018, 'f1': 0.637853470437018, 'support': None}, 'macro_avg': {'precision': 0.5677923816687928, 'recall': 0.7172552457026168, 'f1': 0.5798225984472976, 'support': None}, 'weighted_avg': {'precision': 0.7855774036293833, 'recall': 0.637853470437018, 'f1': 0.6667196466497122, 'support': None}}
Loss: tensor(0.0487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1962, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0946, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2787, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1690, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0693, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0890, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0997, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9758, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1995, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1805, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6971, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1942, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0999, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0741, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0740, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0874, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0976, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2897, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0937, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1934, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0868, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0840, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0985, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0679, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3882, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0908, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0575, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2757, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1821, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0821, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0901, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9830, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2954, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0660, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7348, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1960, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0800, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0981, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3898, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1820, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0935, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0944, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0752, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3841, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0959, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0818, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1909, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0965, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2992, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6898, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0833, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1891, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5741, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0960, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2976, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0993, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0911, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1770, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2537, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1942, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0751, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3739, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0877, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2730, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0751, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1963, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0973, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3897, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1960, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0917, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1987, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0908, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0772, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4758, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0771, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0966, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0736, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1889, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3690, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0772, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1789, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0980, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0990, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1969, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0944, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0918, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0806, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0848, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5575, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3611, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0849, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1452, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0985, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0960, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2800, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0973, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0956, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0980, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0883, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0357, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0953, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0853, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0767, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5637, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0618, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1906, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1855, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0999, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7898, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2817, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3917, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0860, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3960, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0652, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9949, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 4---------------
Evaluating
				 {'precision': {'supports': 0.9053185271770894, 'contradicts': 0.32084690553745926, 'parts_of_same': 0.5692503176620076}, 'recall': {'supports': 0.6921358355674709, 'contradicts': 0.701067615658363, 'parts_of_same': 0.7554806070826307}, 'f1': {'supports': 0.7845024056723221, 'contradicts': 0.44022346368715076, 'parts_of_same': 0.6492753623188405}, 'support': {'supports': 2238, 'contradicts': 281, 'parts_of_same': 593}, 'micro_avg': {'precision': 0.7050128534704371, 'recall': 0.7050128534704371, 'f1': 0.7050128534704371, 'support': None}, 'macro_avg': {'precision': 0.5984719167921854, 'recall': 0.7162280194361549, 'f1': 0.6246670772261045, 'support': None}, 'weighted_avg': {'precision': 0.7885045895411062, 'recall': 0.7050128534704371, 'f1': 0.7276476436522553, 'support': None}}
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0702, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1910, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0908, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2965, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6803, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0843, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0992, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0956, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1839, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2819, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0828, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2928, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1762, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0942, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0737, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0637, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0739, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8768, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2913, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1807, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0813, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7730, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0911, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2980, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0981, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1979, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3637, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1952, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0878, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0565, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0715, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0784, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0629, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0428, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3638, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4953, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4908, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4926, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0817, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0737, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4890, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0993, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1775, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9741, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1739, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3782, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1965, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2741, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2918, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0733, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0821, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1649, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0936, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5961, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1921, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1914, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3575, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1606, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0622, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0390, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4640, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6968, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3797, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0575, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1821, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0678, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0801, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6988, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9739, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4979, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3805, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1736, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0913, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1854, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0605, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0939, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 5---------------
Evaluating
				 {'precision': {'supports': 0.8902316213494461, 'contradicts': 0.4707379134860051, 'parts_of_same': 0.5634379263301501}, 'recall': {'supports': 0.7899910634495085, 'contradicts': 0.6583629893238434, 'parts_of_same': 0.6964586846543002}, 'f1': {'supports': 0.8371212121212122, 'contradicts': 0.5489614243323442, 'parts_of_same': 0.6229260935143288}, 'support': {'supports': 2238, 'contradicts': 281, 'parts_of_same': 593}, 'micro_avg': {'precision': 0.7602827763496144, 'recall': 0.7602827763496144, 'f1': 0.7602827763496144, 'support': None}, 'macro_avg': {'precision': 0.6414691537218671, 'recall': 0.7149375791425507, 'f1': 0.6696695766559616, 'support': None}, 'weighted_avg': {'precision': 0.7900817521154907, 'recall': 0.7602827763496144, 'f1': 0.7702861845818311, 'support': None}}
Loss: tensor(0.0666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0760, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0889, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0997, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0681, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0713, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8736, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0818, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0496, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1741, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1961, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0569, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0771, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2561, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0451, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2949, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1999, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0980, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0840, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2930, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0910, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0787, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7999, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1982, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0889, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0317, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1996, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0943, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0730, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0995, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1690, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1965, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4988, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8913, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0638, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0923, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0820, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0749, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0762, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0999, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0575, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1510, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3910, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2752, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3736, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0993, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0720, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0990, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0989, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5976, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0731, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4604, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0520, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2902, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0954, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 6---------------
Evaluating
				 {'precision': {'supports': 0.8962962962962963, 'contradicts': 0.3069053708439898, 'parts_of_same': 0.6452173913043479}, 'recall': {'supports': 0.7028596961572833, 'contradicts': 0.8540925266903915, 'parts_of_same': 0.6256323777403036}, 'f1': {'supports': 0.787878787878788, 'contradicts': 0.451552210724365, 'parts_of_same': 0.6352739726027397}, 'support': {'supports': 2238, 'contradicts': 281, 'parts_of_same': 593}, 'micro_avg': {'precision': 0.7017994858611826, 'recall': 0.7017994858611826, 'f1': 0.7017994858611826, 'support': None}, 'macro_avg': {'precision': 0.6161396861482112, 'recall': 0.7275282001959927, 'f1': 0.6249016570686309, 'support': None}, 'weighted_avg': {'precision': 0.7952331084067321, 'recall': 0.7017994858611826, 'f1': 0.728430708303245, 'support': None}}
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1938, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2938, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1912, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2938, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0944, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0998, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0727, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5654, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2898, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0860, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3873, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2998, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0777, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0295, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0938, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8815, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0784, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0804, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9878, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0737, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3794, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1741, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0918, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1949, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4996, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1728, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0801, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6937, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0951, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3526, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2953, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8400, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7973, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7717, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 7---------------
Evaluating
				 {'precision': {'supports': 0.8603448275862069, 'contradicts': 0.6115702479338843, 'parts_of_same': 0.6618181818181819}, 'recall': {'supports': 0.8918677390527256, 'contradicts': 0.5266903914590747, 'parts_of_same': 0.6138279932546374}, 'f1': {'supports': 0.8758227292672225, 'contradicts': 0.5659655831739961, 'parts_of_same': 0.636920384951881}, 'support': {'supports': 2238, 'contradicts': 281, 'parts_of_same': 593}, 'micro_avg': {'precision': 0.8059125964010283, 'recall': 0.8059125964010283, 'f1': 0.8059125964010282, 'support': None}, 'macro_avg': {'precision': 0.7112444191127576, 'recall': 0.6774620412554793, 'f1': 0.6929028991310332, 'support': None}, 'weighted_avg': {'precision': 0.8000517820133466, 'recall': 0.8059125964010283, 'f1': 0.8023204965451164, 'support': None}}
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1794, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1879, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0800, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2987, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0326, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2699, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0746, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0973, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0995, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8975, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0810, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0873, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4965, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0968, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0884, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1636, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2943, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1922, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2540, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1811, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 8---------------
Evaluating
				 {'precision': {'supports': 0.868903803131991, 'contradicts': 0.48656716417910445, 'parts_of_same': 0.6734317343173432}, 'recall': {'supports': 0.8677390527256479, 'contradicts': 0.5800711743772242, 'parts_of_same': 0.6155143338954469}, 'f1': {'supports': 0.8683210373351219, 'contradicts': 0.5292207792207791, 'parts_of_same': 0.6431718061674009}, 'support': {'supports': 2238, 'contradicts': 281, 'parts_of_same': 593}, 'micro_avg': {'precision': 0.7937017994858612, 'recall': 0.7937017994858612, 'f1': 0.7937017994858612, 'support': None}, 'macro_avg': {'precision': 0.6763009005428128, 'recall': 0.6877748536661064, 'f1': 0.6802378742411007, 'support': None}, 'weighted_avg': {'precision': 0.7971327451779913, 'recall': 0.7937017994858612, 'f1': 0.7947989722282488, 'support': None}}
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4684, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0910, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1564, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4941, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5987, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0814, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3796, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1951, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1940, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0642, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2844, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1981, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0756, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6273, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2433, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8782, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0824, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0607, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0447, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1742, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5995, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6369, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1904, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5762, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8947, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0359, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2840, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8808, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3798, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0794, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0919, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2460, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0776, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2970, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9913, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0495, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0934, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0415, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1915, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5554, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0949, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1799, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 9---------------
Evaluating
				 {'precision': {'supports': 0.8748828491096532, 'contradicts': 0.4664804469273743, 'parts_of_same': 0.6306451612903226}, 'recall': {'supports': 0.8342269883824843, 'contradicts': 0.594306049822064, 'parts_of_same': 0.6593591905564924}, 'f1': {'supports': 0.854071363220494, 'contradicts': 0.5226917057902974, 'parts_of_same': 0.6446826051112943}, 'support': {'supports': 2238, 'contradicts': 281, 'parts_of_same': 593}, 'micro_avg': {'precision': 0.7792416452442159, 'recall': 0.7792416452442159, 'f1': 0.7792416452442159, 'support': None}, 'macro_avg': {'precision': 0.65733615244245, 'recall': 0.6959640762536802, 'f1': 0.6738152247073619, 'support': None}, 'weighted_avg': {'precision': 0.7914657463172098, 'recall': 0.7792416452442159, 'f1': 0.784249635297409, 'support': None}}
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0915, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6615, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0720, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1619, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0815, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5933, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7567, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3608, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0284, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6861, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0627, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0120, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1999, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1575, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0637, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0736, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7925, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0898, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0878, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0638, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0252, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0741, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0250, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5402, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6793, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2821, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1819, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1938, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1923, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3676, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0967, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0947, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2819, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0697, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2623, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1928, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0381, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0603, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0972, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0958, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0493, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0558, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0863, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0910, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0945, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1764, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6951, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0996, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0752, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3778, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0515, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0764, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1877, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0593, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1446, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0904, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0243, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 10---------------
Evaluating
				 {'precision': {'supports': 0.8931492842535788, 'contradicts': 0.47554347826086957, 'parts_of_same': 0.5545685279187818}, 'recall': {'supports': 0.7806076854334227, 'contradicts': 0.6227758007117438, 'parts_of_same': 0.7369308600337268}, 'f1': {'supports': 0.8330948974725799, 'contradicts': 0.539291217257319, 'parts_of_same': 0.6328747284576394}, 'support': {'supports': 2238, 'contradicts': 281, 'parts_of_same': 593}, 'micro_avg': {'precision': 0.7580334190231363, 'recall': 0.7580334190231363, 'f1': 0.7580334190231363, 'support': None}, 'macro_avg': {'precision': 0.6410870968110767, 'recall': 0.7134381153929645, 'f1': 0.6684202810625127, 'support': None}, 'weighted_avg': {'precision': 0.7909238279584354, 'recall': 0.7580334190231363, 'f1': 0.7684132154782521, 'support': None}}
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0930, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0420, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0758, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0320, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0277, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7787, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3779, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0906, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4679, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0283, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0464, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0529, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0862, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0650, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3648, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0486, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0943, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7873, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1817, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8591e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 11---------------
Evaluating
				 {'precision': {'supports': 0.8630669546436285, 'contradicts': 0.5475285171102662, 'parts_of_same': 0.7078651685393258}, 'recall': {'supports': 0.8927613941018767, 'contradicts': 0.5124555160142349, 'parts_of_same': 0.6374367622259697}, 'f1': {'supports': 0.8776630792883813, 'contradicts': 0.5294117647058825, 'parts_of_same': 0.670807453416149}, 'support': {'supports': 2238, 'contradicts': 281, 'parts_of_same': 593}, 'micro_avg': {'precision': 0.8097686375321337, 'recall': 0.8097686375321337, 'f1': 0.8097686375321337, 'support': None}, 'macro_avg': {'precision': 0.7061535467644068, 'recall': 0.6808845574473604, 'f1': 0.6926274324701375, 'support': None}, 'weighted_avg': {'precision': 0.805001093426814, 'recall': 0.8097686375321337, 'f1': 0.8068006096418787, 'support': None}}
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5659, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6842e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9208e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 12---------------
Evaluating
				 {'precision': {'supports': 0.8555602897315722, 'contradicts': 0.5492424242424242, 'parts_of_same': 0.7145708582834331}, 'recall': {'supports': 0.8972296693476318, 'contradicts': 0.5160142348754448, 'parts_of_same': 0.6037099494097807}, 'f1': {'supports': 0.8758996728462377, 'contradicts': 0.5321100917431193, 'parts_of_same': 0.6544789762340036}, 'support': {'supports': 2238, 'contradicts': 281, 'parts_of_same': 593}, 'micro_avg': {'precision': 0.8068766066838047, 'recall': 0.8068766066838047, 'f1': 0.8068766066838047, 'support': None}, 'macro_avg': {'precision': 0.7064578574191431, 'recall': 0.6723179512109524, 'f1': 0.6874962469411202, 'support': None}, 'weighted_avg': {'precision': 0.8010352084169202, 'recall': 0.8068766066838047, 'f1': 0.8026646646903794, 'support': None}}
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2736, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 13---------------
Evaluating
				 {'precision': {'supports': 0.8645558487247141, 'contradicts': 0.5152542372881356, 'parts_of_same': 0.6961325966850829}, 'recall': {'supports': 0.8784629133154602, 'contradicts': 0.5409252669039146, 'parts_of_same': 0.6374367622259697}, 'f1': {'supports': 0.8714539007092199, 'contradicts': 0.5277777777777779, 'parts_of_same': 0.6654929577464789}, 'support': {'supports': 2238, 'contradicts': 281, 'parts_of_same': 593}, 'micro_avg': {'precision': 0.8020565552699229, 'recall': 0.8020565552699229, 'f1': 0.802056555269923, 'support': None}, 'macro_avg': {'precision': 0.6919808942326441, 'recall': 0.6856083141484483, 'f1': 0.6882415454111589, 'support': None}, 'weighted_avg': {'precision': 0.8009219344338465, 'recall': 0.8020565552699229, 'f1': 0.8011750351177545, 'support': None}}
Loss: tensor(2.3513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4086e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 14---------------
Evaluating
				 {'precision': {'supports': 0.8651488616462347, 'contradicts': 0.5314685314685315, 'parts_of_same': 0.6974169741697417}, 'recall': {'supports': 0.8829311885612153, 'contradicts': 0.5409252669039146, 'parts_of_same': 0.6374367622259697}, 'f1': {'supports': 0.8739495798319329, 'contradicts': 0.5361552028218695, 'parts_of_same': 0.666079295154185}, 'support': {'supports': 2238, 'contradicts': 281, 'parts_of_same': 593}, 'micro_avg': {'precision': 0.8052699228791774, 'recall': 0.8052699228791774, 'f1': 0.8052699228791774, 'support': None}, 'macro_avg': {'precision': 0.6980114557615026, 'recall': 0.6870977392303664, 'f1': 0.6920613592693291, 'support': None}, 'weighted_avg': {'precision': 0.8030572221688907, 'recall': 0.8052699228791774, 'f1': 0.803837979975335, 'support': None}}
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8472e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3767e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4491e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 15---------------
Evaluating
				 {'precision': {'supports': 0.8600257621296694, 'contradicts': 0.5595238095238095, 'parts_of_same': 0.7024482109227872}, 'recall': {'supports': 0.8949955317247542, 'contradicts': 0.501779359430605, 'parts_of_same': 0.6290050590219224}, 'f1': {'supports': 0.8771622509305891, 'contradicts': 0.5290806754221389, 'parts_of_same': 0.6637010676156584}, 'support': {'supports': 2238, 'contradicts': 281, 'parts_of_same': 593}, 'micro_avg': {'precision': 0.8088046272493573, 'recall': 0.8088046272493573, 'f1': 0.8088046272493573, 'support': None}, 'macro_avg': {'precision': 0.7073325941920888, 'recall': 0.6752599833924272, 'f1': 0.6899813313227955, 'support': None}, 'weighted_avg': {'precision': 0.8028649213366336, 'recall': 0.8088046272493573, 'f1': 0.8050564011800658, 'support': None}}
Loss: tensor(9.9416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3224e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3767e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4129e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8750e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3766e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4546e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3964, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7660e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 16---------------
Evaluating
				 {'precision': {'supports': 0.8615318044136737, 'contradicts': 0.5468164794007491, 'parts_of_same': 0.702247191011236}, 'recall': {'supports': 0.889633601429848, 'contradicts': 0.5195729537366548, 'parts_of_same': 0.6323777403035413}, 'f1': {'supports': 0.8753572213673334, 'contradicts': 0.5328467153284672, 'parts_of_same': 0.6654835847382431}, 'support': {'supports': 2238, 'contradicts': 281, 'parts_of_same': 593}, 'micro_avg': {'precision': 0.8071979434447301, 'recall': 0.8071979434447301, 'f1': 0.8071979434447301, 'support': None}, 'macro_avg': {'precision': 0.7035318249418863, 'recall': 0.6805280984900147, 'f1': 0.6912291738113479, 'support': None}, 'weighted_avg': {'precision': 0.8027622728981604, 'recall': 0.8071979434447301, 'f1': 0.8044380315479336, 'support': None}}
Loss: tensor(9.7568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4310e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2243e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3767e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3742e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4491e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8244e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0673, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8654e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0851, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0157, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0412, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1881, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1932, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1247, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3961, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0590, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1978, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2508, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2394, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3311, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0759, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0923, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2742, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5904, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1801, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3892, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8960, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6323, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0987, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3610, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3853, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0906, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3368, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0600, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1745, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0821, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3896, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2906, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 17---------------
Evaluating
				 {'precision': {'supports': 0.8503683241252302, 'contradicts': 0.42424242424242425, 'parts_of_same': 0.5885245901639344}, 'recall': {'supports': 0.8252904378909741, 'contradicts': 0.498220640569395, 'parts_of_same': 0.6053962900505903}, 'f1': {'supports': 0.8376417233560091, 'contradicts': 0.458265139116203, 'parts_of_same': 0.5968412302576891}, 'support': {'supports': 2238, 'contradicts': 281, 'parts_of_same': 593}, 'micro_avg': {'precision': 0.7538560411311054, 'recall': 0.7538560411311054, 'f1': 0.7538560411311054, 'support': None}, 'macro_avg': {'precision': 0.621045112843863, 'recall': 0.6429691228369865, 'f1': 0.6309160309099671, 'support': None}, 'weighted_avg': {'precision': 0.7619959873302056, 'recall': 0.7538560411311054, 'f1': 0.757500491807587, 'support': None}}
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0993, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0992, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1517, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4563, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0531, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6791, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0560, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0536, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7502, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3863, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3826, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1471, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0782, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4857, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1443, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1596, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0499, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1890, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0366, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0483, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4658, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8721, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2448, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1734, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2815, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8992, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0874, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0547, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4751, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0639, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1906, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1750, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0664, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1879, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0751, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4638, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1897, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2838, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2927, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0645, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1736, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2936, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0414, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2538, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0767, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0444, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0580, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0815, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0382, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4990, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1916, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0833, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0935, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2666, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2845, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0877, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0467, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3000, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1391, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0670, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0429, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2000, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2457, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0764, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0229, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1296, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1876, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0945, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2384, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2747, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8957, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0282, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0237, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0825, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0586, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0706, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7982, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0938, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0438, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0735, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0189, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0462, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2891, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0987, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1939, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0748, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0319, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2482, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8674, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1339, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1419, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0800, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0334, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4787, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6835, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3919, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2990, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3474, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0195, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2777, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0568, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3344, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0710, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0765, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0668, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1875, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0947, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2980, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4478, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3960, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6682, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0790, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0789, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0795, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0725, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0519, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1598, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0375, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0816, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0625, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4692, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1671, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6801, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3782, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0719, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0232, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0718, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0680, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9856, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2491, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0427, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0488, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0913, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0516, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0454, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2411, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0862, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0307, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6450, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0270, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2840, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4999, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0407, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0587, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3726, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2373, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0579, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0378, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0696, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4907, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3525, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0374, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0215, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0134, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0977, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1736, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0522, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0792, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0274, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3397, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1812, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0754, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0982, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0350, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0875, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 18---------------
Evaluating
				 {'precision': {'supports': 0.8638580931263858, 'contradicts': 0.5296167247386759, 'parts_of_same': 0.6543859649122807}, 'recall': {'supports': 0.870420017873101, 'contradicts': 0.5409252669039146, 'parts_of_same': 0.6290050590219224}, 'f1': {'supports': 0.8671266414422435, 'contradicts': 0.5352112676056338, 'parts_of_same': 0.6414445399828032}, 'support': {'supports': 2238, 'contradicts': 281, 'parts_of_same': 593}, 'micro_avg': {'precision': 0.7946658097686375, 'recall': 0.7946658097686375, 'f1': 0.7946658097686377, 'support': None}, 'macro_avg': {'precision': 0.6826202609257809, 'recall': 0.6801167812663126, 'f1': 0.6812608163435602, 'support': None}, 'weighted_avg': {'precision': 0.7937620788115045, 'recall': 0.7946658097686375, 'f1': 0.7941518001139867, 'support': None}}
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0533, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3872, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9732, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0543, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1401, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7382e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0435, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8425e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0301, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2387, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1230e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0104, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0628, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0205, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2867, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5214e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1997, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0743, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7334e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3209, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5436e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0557, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5849, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0885, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0924, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0303, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0354, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0707, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3849, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0328, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0322, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2716, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1709, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9974, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0240, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0621, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0202, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4967, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0577, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0879, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0663, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6651e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6995, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2836, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3867, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4888, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3484, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1924, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2935, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0933, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0231, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1392, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5571, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2312, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5395e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3321, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4033, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 19---------------
Evaluating
				 {'precision': {'supports': 0.8623410784743534, 'contradicts': 0.45478723404255317, 'parts_of_same': 0.7384615384615385}, 'recall': {'supports': 0.8789097408400357, 'contradicts': 0.608540925266904, 'parts_of_same': 0.5666104553119731}, 'f1': {'supports': 0.8705465811020137, 'contradicts': 0.5205479452054794, 'parts_of_same': 0.6412213740458015}, 'support': {'supports': 2238, 'contradicts': 281, 'parts_of_same': 593}, 'micro_avg': {'precision': 0.7949871465295629, 'recall': 0.7949871465295629, 'f1': 0.7949871465295629, 'support': None}, 'macro_avg': {'precision': 0.685196616992815, 'recall': 0.684687040472971, 'f1': 0.6774386334510982, 'support': None}, 'weighted_avg': {'precision': 0.8019351666771377, 'recall': 0.7949871465295629, 'f1': 0.7952446966318144, 'support': None}}
Loss: tensor(9.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0588, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4383, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0524, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2723, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0647, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0178, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0662, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0489, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0919, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0895, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0788, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0220, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0961, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0198, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0761, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0551, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2755, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0859, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0179, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0503, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8909, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0188, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0909, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0724, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0541, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6492, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0842, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0249, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0996, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3767e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1405, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0691, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1399, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0271, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3490, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0657, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3297, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0190, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0485, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0266, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2677, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0149, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0963, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0866, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1785, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9544, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(10.2951, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0318, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5781, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0969, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1817, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0158, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0241, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0256, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0824, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0863, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0281, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0468, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0146, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3548, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5937, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0819, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2967, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0142, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0136, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0238, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0840, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2703, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0920, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0521, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0418, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0661, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1436, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0404, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2224, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1923, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0688, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0286, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0117, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1829, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0246, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0164, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0638, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0455, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0293, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4948, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1325, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0389, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1285, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0528, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0384, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 20---------------
Evaluating
				 {'precision': {'supports': 0.8908450704225352, 'contradicts': 0.4708333333333333, 'parts_of_same': 0.5192307692307693}, 'recall': {'supports': 0.7913315460232351, 'contradicts': 0.40213523131672596, 'parts_of_same': 0.7740303541315345}, 'f1': {'supports': 0.8381448177946049, 'contradicts': 0.4337811900191938, 'parts_of_same': 0.6215301286391334}, 'support': {'supports': 2238, 'contradicts': 281, 'parts_of_same': 593}, 'micro_avg': {'precision': 0.752892030848329, 'recall': 0.752892030848329, 'f1': 0.752892030848329, 'support': None}, 'macro_avg': {'precision': 0.6269697243288793, 'recall': 0.6558323771571651, 'f1': 0.6311520454843107, 'support': None}, 'weighted_avg': {'precision': 0.7821077379261396, 'recall': 0.752892030848329, 'f1': 0.7603560356371225, 'support': None}}
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5534, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0509, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1892, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0300, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1931, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0168, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1406, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0555, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0983, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0268, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0338, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0398, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0801, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0353, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0975, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2631, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0172, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0335, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0714, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0578, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0601, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0363, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0138, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0276, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0549, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0278, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0356, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1424, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0119, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8864e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0789, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0309, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0280, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0815, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3624, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0347, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0689, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1208, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2712, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0432, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0784, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5494, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1918, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4552, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0367, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0899, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 21---------------
Evaluating
				 {'precision': {'supports': 0.858647936786655, 'contradicts': 0.4628099173553719, 'parts_of_same': 0.7239915074309978}, 'recall': {'supports': 0.8739946380697051, 'contradicts': 0.597864768683274, 'parts_of_same': 0.5750421585160203}, 'f1': {'supports': 0.8662533215234721, 'contradicts': 0.5217391304347825, 'parts_of_same': 0.6409774436090225}, 'support': {'supports': 2238, 'contradicts': 281, 'parts_of_same': 593}, 'micro_avg': {'precision': 0.7920951156812339, 'recall': 0.7920951156812339, 'f1': 0.792095115681234, 'support': None}, 'macro_avg': {'precision': 0.681816453857675, 'recall': 0.682300521756333, 'f1': 0.6763232985224258, 'support': None}, 'weighted_avg': {'precision': 0.7972463474331539, 'recall': 0.7920951156812339, 'f1': 0.7922182690494391, 'support': None}}
Loss: tensor(7.2446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2971, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0530, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0521e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9883e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0258, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0365, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6769, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0998, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0175, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1672, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0106, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7819e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0139, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1582, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1945, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2635, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0597, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8879, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1166, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0176, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0345, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0883, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5847, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6535, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1316, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0177, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0853, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0550, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3679, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5395, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1928, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4644, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0669, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3665, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0362, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3675, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5441, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2267, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0197, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1173, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0634, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0261, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0199, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0153, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0183, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0213, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0147, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0799, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0105, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0095, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0641, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0850, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0156, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0159, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0997, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4546, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 22---------------
Evaluating
				 {'precision': {'supports': 0.8579040852575488, 'contradicts': 0.48580441640378547, 'parts_of_same': 0.6445672191528545}, 'recall': {'supports': 0.8632707774798928, 'contradicts': 0.5480427046263345, 'parts_of_same': 0.5902192242833052}, 'f1': {'supports': 0.8605790645879734, 'contradicts': 0.5150501672240803, 'parts_of_same': 0.6161971830985915}, 'support': {'supports': 2238, 'contradicts': 281, 'parts_of_same': 593}, 'micro_avg': {'precision': 0.7827763496143959, 'recall': 0.7827763496143959, 'f1': 0.7827763496143959, 'support': None}, 'macro_avg': {'precision': 0.6627585736047296, 'recall': 0.6671775687965108, 'f1': 0.6639421383035483, 'support': None}, 'weighted_avg': {'precision': 0.7836531956213049, 'recall': 0.7827763496143959, 'f1': 0.7828116880190603, 'support': None}}
Loss: tensor(0.0439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0980, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0314, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8434, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0581, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0143, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1181, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0235, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0160, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0693, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4379, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2747, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0559, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1553, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0263, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0346, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0803, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0886, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0330, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0351, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2566, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0103, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0259, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0109, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0302, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2385, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0298, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3773, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9984, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0602, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9481, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0461, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0982, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3185, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0630, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0763, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0315, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0192, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2523, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0506, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0219, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0150, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0210, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2620, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0871, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0113, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0211, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0279, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5305, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0626, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0469, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0498, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4511, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0372, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7216, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3291, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0923, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5961, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0343, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4294, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0929, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0556, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1617, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1239, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0129, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1233, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0255, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3360, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6711, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2358, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2865, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0514, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0539, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0466, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8595, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2115, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0809, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0472, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0212, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2545, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0864, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0946, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0206, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1570, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1766, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0612, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0077, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0308, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0094, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0126, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0458, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0154, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0386, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0331, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0475, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0376, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.9180, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0217, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0063, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0341, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2327, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0695, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0098, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0988, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6975, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0336, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5824, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0306, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1182, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0936, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0340, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0110, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0787, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1912, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0299, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2934, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0200, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0416, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1512, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7903, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0269, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0786, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0218, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0260, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0221, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0072, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0442, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0081, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1396, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1230, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0820, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0127, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2453, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7184, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0123, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0342, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0075, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0822, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0254, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6880, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0609, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0479, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0169, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3616, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5686, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0128, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0361, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0140, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0584, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1685, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0497, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0430, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0893, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2637, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0174, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0155, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9802, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0736, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0088, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0614, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0832, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5633, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3905, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1226, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0265, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4148, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0121, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1585, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0403, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8683, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0245, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6950, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2888, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0869, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0194, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0275, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0518, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0656, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0193, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4655, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0092, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0592, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1251, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0572, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0370, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0228, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0573, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9731e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1574, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0409, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1171, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0936, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0470, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4704, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3591, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0909, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0332, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0371, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0187, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1289, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0527, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0223, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6144, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0456, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3651, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6589, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2894, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0145, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0122, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0738, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1473, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0264, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0653, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3505, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1417, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.6701, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0090, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0431, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0667, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0818, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0858, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0364, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0207, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0313, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0167, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2954, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0646, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0163, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0107, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0204, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0236, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0476, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1161, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0337, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0112, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0594, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3425, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0410, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0939, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0152, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4349, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.4892, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0272, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3751, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0310, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2729, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0780, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2426, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2101, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0065, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1287, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0033, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0643, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0242, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3939, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0118, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2408, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0222, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0141, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1504, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0599, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0422, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0076, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0413, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3783, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0084, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0108, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2186, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2479e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0053, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0445, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0248, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0111, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 23---------------
Evaluating
				 {'precision': {'supports': 0.8675555555555555, 'contradicts': 0.5015479876160991, 'parts_of_same': 0.6883116883116883}, 'recall': {'supports': 0.872207327971403, 'contradicts': 0.5765124555160143, 'parts_of_same': 0.6256323777403036}, 'f1': {'supports': 0.8698752228163992, 'contradicts': 0.5364238410596026, 'parts_of_same': 0.6554770318021201}, 'support': {'supports': 2238, 'contradicts': 281, 'parts_of_same': 593}, 'micro_avg': {'precision': 0.7985218508997429, 'recall': 0.7985218508997429, 'f1': 0.798521850899743, 'support': None}, 'macro_avg': {'precision': 0.6858050771611143, 'recall': 0.6914507204092403, 'f1': 0.6872586985593739, 'support': None}, 'weighted_avg': {'precision': 0.8003512689660309, 'recall': 0.7985218508997429, 'f1': 0.7989118662787619, 'support': None}}
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0067, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0082, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0102, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0352, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0061, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0421, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0049, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0393, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7941, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0080, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.8449, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0380, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0752, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0823, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1100, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0290, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0465, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1532, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0225, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0035, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0201, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0124, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0423, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0091, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0613, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0089, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0463, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0074, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0162, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0062, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0500, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0165, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0196, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0388, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2744, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0632, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0125, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0292, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0031, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0085, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0253, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0583, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0070, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0542, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0116, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0071, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0087, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0203, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0044, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0132, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0058, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0096, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0079, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0083, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0091e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0068, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0133, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0377, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0355, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0052, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1722, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0234, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1831, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0151, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0137, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0069, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0214, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0774, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0097, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0262, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0170, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0477, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0048, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0827, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.7439, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0055, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0042, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0028, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0694, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0440, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0064, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3049e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7170e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0041, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0329, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9837e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.1437, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0040, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3562, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0333, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0288, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0066, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0114, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0244, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0576, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0038, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0037, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0047, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3691e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6180e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0027, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0507, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0257, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.2034, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0025, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0046, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.5480, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0501, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0059, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0015, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0227, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0131, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0135, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0890, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.3191, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7845e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 24---------------
Evaluating
				 {'precision': {'supports': 0.8528656971770744, 'contradicts': 0.5555555555555556, 'parts_of_same': 0.6686159844054581}, 'recall': {'supports': 0.8909740840035746, 'contradicts': 0.5160142348754448, 'parts_of_same': 0.5784148397976391}, 'f1': {'supports': 0.8715034965034965, 'contradicts': 0.5350553505535056, 'parts_of_same': 0.620253164556962}, 'support': {'supports': 2238, 'contradicts': 281, 'parts_of_same': 593}, 'micro_avg': {'precision': 0.7975578406169666, 'recall': 0.7975578406169666, 'f1': 0.7975578406169666, 'support': None}, 'macro_avg': {'precision': 0.692345745712696, 'recall': 0.6618010528922195, 'f1': 0.6756040038713214, 'support': None}, 'weighted_avg': {'precision': 0.7909106105867096, 'recall': 0.7975578406169666, 'f1': 0.7932472703286113, 'support': None}}
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7664e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0057, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0029, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8656e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0078, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0073, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0060, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0304, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0051, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7797e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0056, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0093, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0130, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0099, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7555e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0045, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4145e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0043, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0030, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0324, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0036, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0039, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4129e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0022, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0054, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0020, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0487, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0019, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 25---------------
Evaluating
				 {'precision': {'supports': 0.8563991323210413, 'contradicts': 0.5062111801242236, 'parts_of_same': 0.6845360824742268}, 'recall': {'supports': 0.8820375335120644, 'contradicts': 0.5800711743772242, 'parts_of_same': 0.5598650927487352}, 'f1': {'supports': 0.8690292758089369, 'contradicts': 0.5406301824212272, 'parts_of_same': 0.6159554730983302}, 'support': {'supports': 2238, 'contradicts': 281, 'parts_of_same': 593}, 'micro_avg': {'precision': 0.7933804627249358, 'recall': 0.7933804627249358, 'f1': 0.7933804627249358, 'support': None}, 'macro_avg': {'precision': 0.6823821316398305, 'recall': 0.6739912668793413, 'f1': 0.6752049771094981, 'support': None}, 'weighted_avg': {'precision': 0.7920297225760327, 'recall': 0.7933804627249358, 'f1': 0.791152376628559, 'support': None}}
Loss: tensor(3.3673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0018, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2204e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5621e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4491e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0245e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3767e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6835e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9222e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3767e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0570e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0026, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4310e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3271e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4696e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1013e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0024, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4193e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0086, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3586e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0541e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3473e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3774e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4098e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0011, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3586e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4491e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6436e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 26---------------
Evaluating
				 {'precision': {'supports': 0.8573281452658884, 'contradicts': 0.5192307692307693, 'parts_of_same': 0.6878850102669405}, 'recall': {'supports': 0.886058981233244, 'contradicts': 0.5765124555160143, 'parts_of_same': 0.5649241146711635}, 'f1': {'supports': 0.8714568226763348, 'contradicts': 0.5463743676222598, 'parts_of_same': 0.6203703703703705}, 'support': {'supports': 2238, 'contradicts': 281, 'parts_of_same': 593}, 'micro_avg': {'precision': 0.7969151670951157, 'recall': 0.7969151670951157, 'f1': 0.7969151670951157, 'support': None}, 'macro_avg': {'precision': 0.6881479749211993, 'recall': 0.6758318504734739, 'f1': 0.6794005202229885, 'support': None}, 'weighted_avg': {'precision': 0.7945115830164525, 'recall': 0.7969151670951157, 'f1': 0.7942580964270958, 'support': None}}
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5954e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3693e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9682e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4393e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8810e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0021, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3224e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8733e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5937e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8714e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6118e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3224e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4482e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0080e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2451e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4177e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8406e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0357e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6737e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2962e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0050, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8425e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9211e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0966e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1248e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6697e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5053e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0058e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7055e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2000e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0553e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8244e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9197e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6663e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7738e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5537e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9497e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2782e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1315e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4822e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9414e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1736e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4671e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7288e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0014, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3899e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8591e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 27---------------
Evaluating
				 {'precision': {'supports': 0.8569576490924805, 'contradicts': 0.5227272727272727, 'parts_of_same': 0.6836734693877551}, 'recall': {'supports': 0.886058981233244, 'contradicts': 0.5729537366548043, 'parts_of_same': 0.5649241146711635}, 'f1': {'supports': 0.8712653778558876, 'contradicts': 0.5466893039049237, 'parts_of_same': 0.61865189289012}, 'support': {'supports': 2238, 'contradicts': 281, 'parts_of_same': 593}, 'micro_avg': {'precision': 0.7965938303341902, 'recall': 0.7965938303341902, 'f1': 0.7965938303341902, 'support': None}, 'macro_avg': {'precision': 0.6877861304025027, 'recall': 0.6746456108530706, 'f1': 0.6788688582169771, 'support': None}, 'weighted_avg': {'precision': 0.7937583385772088, 'recall': 0.7965938303341902, 'f1': 0.7938213954121469, 'support': None}}
Loss: tensor(1.6291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4293e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8823e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9582e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6844e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7916e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6301e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8500e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4672e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4491e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2861e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3466e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0016, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8600e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6817e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1316e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3586e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4335e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9740e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8052e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8344e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1638e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0185e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9741e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3022e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0146e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8043e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5188e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3534e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4675e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1158e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7206e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8244e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5034e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5757e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9833e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3303e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2654e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1611e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5815e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8275e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6659e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9655e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8835e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3767e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6588e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5281e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3858e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8928e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5016e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5136e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6482e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7648e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5949e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9640e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4426e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0010, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9530e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1106e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8203e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0032, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6453e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8268e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8102e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2434e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4297e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4491e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3947e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8727e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9690e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8397e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0914e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9587e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2887e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5939e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7684e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6888e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9995e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6027e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5576e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4026e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1458e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2755e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3220e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2068e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3460e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4287e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 28---------------
Evaluating
				 {'precision': {'supports': 0.8570811744386874, 'contradicts': 0.5264900662251656, 'parts_of_same': 0.6862348178137652}, 'recall': {'supports': 0.886952636282395, 'contradicts': 0.5658362989323843, 'parts_of_same': 0.5716694772344013}, 'f1': {'supports': 0.8717610891523935, 'contradicts': 0.5454545454545454, 'parts_of_same': 0.6237350505979761}, 'support': {'supports': 2238, 'contradicts': 281, 'parts_of_same': 593}, 'micro_avg': {'precision': 0.797879177377892, 'recall': 0.797879177377892, 'f1': 0.797879177377892, 'support': None}, 'macro_avg': {'precision': 0.6899353528258727, 'recall': 0.6748194708163936, 'f1': 0.6803168950683051, 'support': None}, 'weighted_avg': {'precision': 0.7946750077013549, 'recall': 0.797879177377892, 'f1': 0.7950350031492236, 'support': None}}
Loss: tensor(1.9645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3079e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5665e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6119e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9637e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8007e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9162e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9419e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8382e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5103e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7493e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0012, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9828e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0360e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4325e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0023, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0745e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9718e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4427e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9511e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3885e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4307e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3321e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2599e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9967e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2543e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8715e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5249e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9152e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5603e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9100e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5751e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6566e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4548e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8473e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1820e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3509e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7448e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6491e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9784e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1259e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2795e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5195e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8343e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7217e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2779e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4159e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8425e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8890e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1135e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7084e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1639e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6578e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0008, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6197e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6384e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7054e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8646e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4615e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1051e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8517e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2688e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9859e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8112e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2649e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6658e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6462e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9844e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6912e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7258e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5150e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6946e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5436e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3212e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1947e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4129e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9380e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7082e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8050e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8708e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4759e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0752e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8244e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4809e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0811e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1556e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4650e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0327e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2347e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0915e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4398e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8698e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2036e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7201e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3882e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0407e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6604e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7172e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8786e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0609e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1657e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4149e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1059e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4853e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7533e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3867e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4402e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3522e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4161e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0733e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8243e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3265e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3109e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5239e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9129e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2040e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8181e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5234e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4663e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9921e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6164e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3560e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7378e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3431e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0390e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4716e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2363e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8289e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1595e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8917e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6224e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7814e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9678e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5440e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7726e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7907e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0420e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6208e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3672e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3804e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4272e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2134e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0470e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7658e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9214e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7232e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5442e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9503e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0010e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1583e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1111e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5061e-05, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 29---------------
Evaluating
				 {'precision': {'supports': 0.8571428571428571, 'contradicts': 0.5284280936454849, 'parts_of_same': 0.6854838709677419}, 'recall': {'supports': 0.8873994638069705, 'contradicts': 0.5622775800711743, 'parts_of_same': 0.5733558178752108}, 'f1': {'supports': 0.8720087815587266, 'contradicts': 0.5448275862068966, 'parts_of_same': 0.6244260789715335}, 'support': {'supports': 2238, 'contradicts': 281, 'parts_of_same': 593}, 'micro_avg': {'precision': 0.7982005141388174, 'recall': 0.7982005141388174, 'f1': 0.7982005141388173, 'support': None}, 'macro_avg': {'precision': 0.6903516072520279, 'recall': 0.6743442872511186, 'f1': 0.6804208155790522, 'support': None}, 'weighted_avg': {'precision': 0.7947512673791665, 'recall': 0.7982005141388174, 'f1': 0.795288197198807, 'support': None}}
Loss: tensor(5.2676e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5266e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0455e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4944e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6707e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8796e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6792e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1896e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8635e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7294e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5965e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5971e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3992e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6800e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1780e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8879e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2120e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2001e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5660e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8642e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9241e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6478e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9895e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6627e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0567e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3840e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7062e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3757e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0006, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5765e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5484e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2133e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5320e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6520e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3404e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3576e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8064e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2499e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2573e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8932e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9016e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5259e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3585e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7873e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1683e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1277e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2221e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5374e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6634e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1686e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2128e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0799e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5061e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8155e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6565e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4897e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7285e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6295e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7121e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0551e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7673e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5938e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5802e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5436e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2589e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5396e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0740e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6805e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4017e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3377e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8787e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1225e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6631e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4787e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5339e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8492e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9231e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0935e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7749e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7157e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7124e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8472e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0624e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9285e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4166e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3734e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1095e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0017, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1760e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1299e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2038e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2647e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6827e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2037e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0744e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1316e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0781e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3465e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5254e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1089e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2847e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5511e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6345e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8452e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2526e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0861e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6839e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1140e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1232e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0189e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8490e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0394e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0429e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1985e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0711e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1178e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0009, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7772e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6009e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5628e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8474e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5758e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7456e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9702e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4996e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9871e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3811e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8062e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9260e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3367e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9705e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3142e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1105e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5846e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8903e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9099e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1024e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6300e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2400e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3630e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0852e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6960e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9559e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8930e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6435e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7015e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1468e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3184e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7450e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0879e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6364e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7012e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7431e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9876e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0734e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5845e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8353e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2399e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2173e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7206e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2906e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8499e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7070e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4354e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6710e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5529e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9365e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2194e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1457e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0854e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7171e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9385e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8527e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9310e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9031e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5929e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4442e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6020e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8018e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3351e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3326e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6284e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7025e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1114e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7069e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2182e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0822e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4666e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4970e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4852e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6182e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5777e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6164e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3362e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3914e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5850e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2407e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5078e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1776e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1584e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5156e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6029e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0371e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5237e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0680e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2636e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2383e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7123e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6877e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0853e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8151e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2168e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2510e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6535e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2994e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7477e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5863e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5187e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3630e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1413e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2279e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9238e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7661e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9900e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3855e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4934e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6244e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3270e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7069e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1048e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8244e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5821e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7081e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9097e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8336e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2019e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7977e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8476e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3253e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4282e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4403e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5263e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1457e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7487e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6526e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6840e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0838e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8742e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0706e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7340e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3268e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1502e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3223e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0607e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0892e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3126e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7829e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7035e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6928e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2632e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4525e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4579e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7930e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1131e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3602e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0762e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9398e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0950e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9724e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6355e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1184e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1250e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0425e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2836e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9104e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9027e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7280e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2218e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8880e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4593e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8650e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0629e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8141e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0689e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4309e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0333e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4314e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3042e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4443e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5051e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1735e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0807e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7923e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4592e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8502e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4337e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9330e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9042e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8165e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5440e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3428e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9304e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4039e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8923e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2870e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1349e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8286e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0108e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8424e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3639e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3312e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4958e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9122e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3723e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6228e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1552e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1104e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8111e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2001e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0597e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4577e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4994e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5125e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4418e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8824e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4841e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0963e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0438e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2312e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7226e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8834e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6215e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3006e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0155e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3926e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5303e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6120e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1057e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7667e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5717e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8517e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7794e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
			------------EPOCH 30---------------
Evaluating
				 {'precision': {'supports': 0.8564036222509702, 'contradicts': 0.5254237288135594, 'parts_of_same': 0.6827309236947792}, 'recall': {'supports': 0.8873994638069705, 'contradicts': 0.5516014234875445, 'parts_of_same': 0.5733558178752108}, 'f1': {'supports': 0.8716260697827518, 'contradicts': 0.5381944444444445, 'parts_of_same': 0.6232813932172319}, 'support': {'supports': 2238, 'contradicts': 281, 'parts_of_same': 593}, 'micro_avg': {'precision': 0.7972365038560412, 'recall': 0.7972365038560412, 'f1': 0.7972365038560412, 'support': None}, 'macro_avg': {'precision': 0.6881860915864362, 'recall': 0.6707855683899085, 'f1': 0.6777006358148094, 'support': None}, 'weighted_avg': {'precision': 0.793423782823035, 'recall': 0.7972365038560412, 'f1': 0.7941959027122448, 'support': None}}
Loss: tensor(6.5528e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3889e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0515e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4753e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5415e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5078e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2769e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5801e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7564e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8391e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7866e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9278e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1371e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9439e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5417e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1585e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2761e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3561e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1613e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3175e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2536e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5832e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8199e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5163e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7346e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7933e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0746e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8561e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6722e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9691e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9324e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9378e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4137e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4927e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1712e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4168e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6216e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7020e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4212e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9489e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3072e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5617e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5014e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5251e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1413e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.8183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0505e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4322e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9149e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9148e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4767e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9207e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2447e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5370e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7942e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9605e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3175e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4044e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5386e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4317e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2544e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1296e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3614e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3475e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8831e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3262e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6570e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4535e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2771e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2270e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7369e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0552e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2632e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5290e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9198e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5247e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0013, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7568e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9350e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3908e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5352e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6820e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5834e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0870e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8569e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7586e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8005e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6073e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7205e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4065e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0408e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6233e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0720e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4130e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5763e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7881e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4581e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8075e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8495e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0154e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4643e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3878e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5790e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1531e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9625e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3901e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1546e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.9778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8967e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9676e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0009e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0826e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5709e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0685e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4980e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3356e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2495e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4261e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6115e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1868e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5911e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2314e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3366e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7545e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8605e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0798e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9677e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2562e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7612e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0294e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2544e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7095e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1227e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3496e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3087e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4490e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9591e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8425e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1115e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0318e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4999e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6341e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3196e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5953e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6201e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9309e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8392e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0951e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0412e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0508e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6389e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3875e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4018e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6313e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5488e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7709e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5215e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3846e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3718e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0638e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2041e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9012e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9459e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1202e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5577e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8679e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7387e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4739e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8813e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7926e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6802e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0007, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2144e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1633e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1864e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0729e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1969e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2089e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9486e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2373e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1494e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8968e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4036e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7789e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4298e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4667e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6269e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0147e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7444e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6000e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7157e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9603e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3086e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2226e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7549e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2348e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5574e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6327e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0616e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3153e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6662e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0191e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1107e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1590e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8944e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9824e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0148e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0955e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1978e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8063e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6590e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5174e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2451e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8376e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4031e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4689e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3540e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0620e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7608e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8524e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9143e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4597e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8416e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6449e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2308e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8993e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1952e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3865e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1594e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2773e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3910e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0803e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7984e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9183e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7025e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9961e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0345e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8945e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7812e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9917e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0653e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6687e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3902e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2623e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5785e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0692e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.3376e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7931e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5991e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8716e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2950e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7719e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9839e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6614e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9748e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4851e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8028e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9516e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3898e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5798e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4395e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0641e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1135e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.0508e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2242e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1983e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3038e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9229e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5721e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2596e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4924e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8694e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4080e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3855e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9466e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0336e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4988e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6532e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2133e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8606e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7974e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8831e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6751e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8047e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6160e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0959e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4801e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6387e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9780e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4486e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4463e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1764e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5973e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1956e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8381e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0610e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7375e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6932e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4601e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2219e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2302e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0770e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9872e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8192e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5661e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7793e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6023e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7290e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8791e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6119e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5498e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2976e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6478e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8528e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5423e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4319e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9510e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2919e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1727e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8749e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3997e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4701e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8856e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6645e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4173e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0279e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6843e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8617e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2775e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8138e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1771e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0235e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5580e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2758e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.1096e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4128e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2943e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.7250e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1045e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0246e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5306e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0828e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3644e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0563e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4454e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5032e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3939e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0053e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3449e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7681e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9694e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1365e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9305e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2849e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2137e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2901e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9692e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8513e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3523e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1920e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7543e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4891e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7033e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9608e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8421e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3899e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4621e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8783e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4349e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6159e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9193e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0729e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4665e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0713e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0504e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4436e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0445e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3857e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8469e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3537e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0571e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5512e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7246e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1004e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9483e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0941e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3848e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7656e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5564e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7519e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8199e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6291e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4305e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1277e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.2318e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1323e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7747e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5209e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1060e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8626e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9237e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5388e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1126e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7745e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6252e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9685e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1453e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6363e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4217e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2743e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5210e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.9647e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3077e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3507e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0005, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5151e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9598e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4941e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0472e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5987e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3368e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2177e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6886e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7396e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1634e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9873e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1132e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8830e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4538e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4711e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9575e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8618e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3957e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7113e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7338e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8380e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1311e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9422e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2539e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3940e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6433e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0501e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.7700e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8200e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5347e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9599e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.5122e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5683e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9418e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3096e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7970e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1996e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7065e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9778e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0004, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4572e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5166e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0905e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1908e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3793e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0054e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2989e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9965e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0437e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8550e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0235e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6093e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3131e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7513e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2092e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0866e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5572e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1547e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0806e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6756e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3117e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7956e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7769e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7085e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1228e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1241e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8446e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3400e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4393e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0921e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0101e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5874e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3424e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6795e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6641e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5979e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8480e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4530e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2558e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2116e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4848e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9281e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5267e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4021e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2404e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9643e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9354e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3493e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5784e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5816e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.6276e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2088e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8139e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2700e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6071e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2588e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9555e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3893e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1768e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9223e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6979e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0481e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0274e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.8023e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9190e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3884e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0559e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5118e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8014e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0869e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4881e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.0146e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4918e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3959e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9110e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5616e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0076e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1127e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6976e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6707e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3410e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1272e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5292e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2857e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9699e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6964e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4760e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.4579e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6986e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9736e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0003, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8894e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8288e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3909e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0860e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4804e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3581e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6477e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5029e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5557e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7202e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0236e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0485e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5934e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2554e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8113e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4342e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2273e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0897e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0732e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2519e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3219e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4606e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.1775e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4913e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8875e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8968e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2067e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2720e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0553e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.3674e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9432e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6481e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1047e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3411e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.2725e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1331e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8256e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3160e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.9330e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3307e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0300e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7140e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1952e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4623e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5753e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0372e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3850e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.8425e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2409e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4662e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3680e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5213e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2514e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3504e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1619e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6296e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1484e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4704e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8961e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2469e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0328e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8008e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3981e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7427e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1766e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6938e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9176e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7837e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2255e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1815e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.7982e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1497e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.1283e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0186e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0287e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.5890e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2862e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1389e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1332e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9034e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9030e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0415e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6671e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2379e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.3433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5299e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7833e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8622e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3762e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6204e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0441e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1003e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5539e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7021e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1730e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2252e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7464e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2056e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3806e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4046e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6788e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8074e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6011e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.4756e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3082e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.8332e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9467e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.7383e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3444e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8169e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9240e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.2358e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5922e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0698e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8786e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6566e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3090e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9462e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5435e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8936e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.4124e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0323e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3263e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5405e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4433e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8738e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5725e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.6789e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7002e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1205e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6884e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1087e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.5983e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.5033e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.2813e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.1321e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.8292e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.9374e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.6659e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.2045e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9100e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2669e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.0066e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0230e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.5990e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5073e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0506e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3703e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0358e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.6083e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.4985e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1409e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9568e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.5254e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.3471e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3594e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0416e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0098e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.7975e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.7341e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.7205e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.4264e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.6385e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.9674e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6703e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0542e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3904e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.2401e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.0460e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5361e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0910e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3652e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.9167e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0005e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2888e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0329e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.6522e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.6948e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7652e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8818e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6754e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.3356e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0367e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.4892e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.4179e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9925e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0071e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.7475e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.5422e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.4728e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.5391e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.4992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.0548e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.3267e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9458e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3987e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8695e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0002, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.1430e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2668e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1210e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7109e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.7471e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(6.6257e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1972e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.3943e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.0142e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(7.0778e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1261e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(0.0001, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.2808e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.1091e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.9915e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(8.9060e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9998e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.1825e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3612e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8518e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8195e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.0359e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5461e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.2221e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8919e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.8974e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.3625e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.1301e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(2.8906e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.3992e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.5480e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.1338e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(1.2670e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(4.9056e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.0094e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(5.8107e-06, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(9.6948e-05, device='cuda:0', grad_fn=<DivBackward0>)
Loss: tensor(3.8215e-05, device='cuda:0', grad_fn=<DivBackward0>)
